162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright (c) 2004 Topspin Communications. All rights reserved. 362306a36Sopenharmony_ci * Copyright (c) 2005 Cisco Systems. All rights reserved. 462306a36Sopenharmony_ci * Copyright (c) 2005 Mellanox Technologies. All rights reserved. 562306a36Sopenharmony_ci * Copyright (c) 2004 Voltaire, Inc. All rights reserved. 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * This software is available to you under a choice of one of two 862306a36Sopenharmony_ci * licenses. You may choose to be licensed under the terms of the GNU 962306a36Sopenharmony_ci * General Public License (GPL) Version 2, available from the file 1062306a36Sopenharmony_ci * COPYING in the main directory of this source tree, or the 1162306a36Sopenharmony_ci * OpenIB.org BSD license below: 1262306a36Sopenharmony_ci * 1362306a36Sopenharmony_ci * Redistribution and use in source and binary forms, with or 1462306a36Sopenharmony_ci * without modification, are permitted provided that the following 1562306a36Sopenharmony_ci * conditions are met: 1662306a36Sopenharmony_ci * 1762306a36Sopenharmony_ci * - Redistributions of source code must retain the above 1862306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 1962306a36Sopenharmony_ci * disclaimer. 2062306a36Sopenharmony_ci * 2162306a36Sopenharmony_ci * - Redistributions in binary form must reproduce the above 2262306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 2362306a36Sopenharmony_ci * disclaimer in the documentation and/or other materials 2462306a36Sopenharmony_ci * provided with the distribution. 2562306a36Sopenharmony_ci * 2662306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 2762306a36Sopenharmony_ci * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 2862306a36Sopenharmony_ci * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 2962306a36Sopenharmony_ci * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 3062306a36Sopenharmony_ci * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 3162306a36Sopenharmony_ci * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 3262306a36Sopenharmony_ci * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 3362306a36Sopenharmony_ci * SOFTWARE. 3462306a36Sopenharmony_ci */ 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ci#include <linux/string.h> 3762306a36Sopenharmony_ci#include <linux/slab.h> 3862306a36Sopenharmony_ci#include <linux/sched.h> 3962306a36Sopenharmony_ci 4062306a36Sopenharmony_ci#include <asm/io.h> 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_ci#include <rdma/ib_verbs.h> 4362306a36Sopenharmony_ci#include <rdma/ib_cache.h> 4462306a36Sopenharmony_ci#include <rdma/ib_pack.h> 4562306a36Sopenharmony_ci#include <rdma/uverbs_ioctl.h> 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_ci#include "mthca_dev.h" 4862306a36Sopenharmony_ci#include "mthca_cmd.h" 4962306a36Sopenharmony_ci#include "mthca_memfree.h" 5062306a36Sopenharmony_ci#include "mthca_wqe.h" 5162306a36Sopenharmony_ci 5262306a36Sopenharmony_cienum { 5362306a36Sopenharmony_ci MTHCA_MAX_DIRECT_QP_SIZE = 4 * PAGE_SIZE, 5462306a36Sopenharmony_ci MTHCA_ACK_REQ_FREQ = 10, 5562306a36Sopenharmony_ci MTHCA_FLIGHT_LIMIT = 9, 5662306a36Sopenharmony_ci MTHCA_UD_HEADER_SIZE = 72, /* largest UD header possible */ 5762306a36Sopenharmony_ci MTHCA_INLINE_HEADER_SIZE = 4, /* data segment overhead for inline */ 5862306a36Sopenharmony_ci MTHCA_INLINE_CHUNK_SIZE = 16 /* inline data segment chunk */ 5962306a36Sopenharmony_ci}; 6062306a36Sopenharmony_ci 6162306a36Sopenharmony_cienum { 6262306a36Sopenharmony_ci MTHCA_QP_STATE_RST = 0, 6362306a36Sopenharmony_ci MTHCA_QP_STATE_INIT = 1, 6462306a36Sopenharmony_ci MTHCA_QP_STATE_RTR = 2, 6562306a36Sopenharmony_ci MTHCA_QP_STATE_RTS = 3, 6662306a36Sopenharmony_ci MTHCA_QP_STATE_SQE = 4, 6762306a36Sopenharmony_ci MTHCA_QP_STATE_SQD = 5, 6862306a36Sopenharmony_ci MTHCA_QP_STATE_ERR = 6, 6962306a36Sopenharmony_ci MTHCA_QP_STATE_DRAINING = 7 7062306a36Sopenharmony_ci}; 7162306a36Sopenharmony_ci 7262306a36Sopenharmony_cienum { 7362306a36Sopenharmony_ci MTHCA_QP_ST_RC = 0x0, 7462306a36Sopenharmony_ci MTHCA_QP_ST_UC = 0x1, 7562306a36Sopenharmony_ci MTHCA_QP_ST_RD = 0x2, 7662306a36Sopenharmony_ci MTHCA_QP_ST_UD = 0x3, 7762306a36Sopenharmony_ci MTHCA_QP_ST_MLX = 0x7 7862306a36Sopenharmony_ci}; 7962306a36Sopenharmony_ci 8062306a36Sopenharmony_cienum { 8162306a36Sopenharmony_ci MTHCA_QP_PM_MIGRATED = 0x3, 8262306a36Sopenharmony_ci MTHCA_QP_PM_ARMED = 0x0, 8362306a36Sopenharmony_ci MTHCA_QP_PM_REARM = 0x1 8462306a36Sopenharmony_ci}; 8562306a36Sopenharmony_ci 8662306a36Sopenharmony_cienum { 8762306a36Sopenharmony_ci /* qp_context flags */ 8862306a36Sopenharmony_ci MTHCA_QP_BIT_DE = 1 << 8, 8962306a36Sopenharmony_ci /* params1 */ 9062306a36Sopenharmony_ci MTHCA_QP_BIT_SRE = 1 << 15, 9162306a36Sopenharmony_ci MTHCA_QP_BIT_SWE = 1 << 14, 9262306a36Sopenharmony_ci MTHCA_QP_BIT_SAE = 1 << 13, 9362306a36Sopenharmony_ci MTHCA_QP_BIT_SIC = 1 << 4, 9462306a36Sopenharmony_ci MTHCA_QP_BIT_SSC = 1 << 3, 9562306a36Sopenharmony_ci /* params2 */ 9662306a36Sopenharmony_ci MTHCA_QP_BIT_RRE = 1 << 15, 9762306a36Sopenharmony_ci MTHCA_QP_BIT_RWE = 1 << 14, 9862306a36Sopenharmony_ci MTHCA_QP_BIT_RAE = 1 << 13, 9962306a36Sopenharmony_ci MTHCA_QP_BIT_RIC = 1 << 4, 10062306a36Sopenharmony_ci MTHCA_QP_BIT_RSC = 1 << 3 10162306a36Sopenharmony_ci}; 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_cienum { 10462306a36Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE = 1 << 5 10562306a36Sopenharmony_ci}; 10662306a36Sopenharmony_ci 10762306a36Sopenharmony_cistruct mthca_qp_path { 10862306a36Sopenharmony_ci __be32 port_pkey; 10962306a36Sopenharmony_ci u8 rnr_retry; 11062306a36Sopenharmony_ci u8 g_mylmc; 11162306a36Sopenharmony_ci __be16 rlid; 11262306a36Sopenharmony_ci u8 ackto; 11362306a36Sopenharmony_ci u8 mgid_index; 11462306a36Sopenharmony_ci u8 static_rate; 11562306a36Sopenharmony_ci u8 hop_limit; 11662306a36Sopenharmony_ci __be32 sl_tclass_flowlabel; 11762306a36Sopenharmony_ci u8 rgid[16]; 11862306a36Sopenharmony_ci} __packed; 11962306a36Sopenharmony_ci 12062306a36Sopenharmony_cistruct mthca_qp_context { 12162306a36Sopenharmony_ci __be32 flags; 12262306a36Sopenharmony_ci __be32 tavor_sched_queue; /* Reserved on Arbel */ 12362306a36Sopenharmony_ci u8 mtu_msgmax; 12462306a36Sopenharmony_ci u8 rq_size_stride; /* Reserved on Tavor */ 12562306a36Sopenharmony_ci u8 sq_size_stride; /* Reserved on Tavor */ 12662306a36Sopenharmony_ci u8 rlkey_arbel_sched_queue; /* Reserved on Tavor */ 12762306a36Sopenharmony_ci __be32 usr_page; 12862306a36Sopenharmony_ci __be32 local_qpn; 12962306a36Sopenharmony_ci __be32 remote_qpn; 13062306a36Sopenharmony_ci u32 reserved1[2]; 13162306a36Sopenharmony_ci struct mthca_qp_path pri_path; 13262306a36Sopenharmony_ci struct mthca_qp_path alt_path; 13362306a36Sopenharmony_ci __be32 rdd; 13462306a36Sopenharmony_ci __be32 pd; 13562306a36Sopenharmony_ci __be32 wqe_base; 13662306a36Sopenharmony_ci __be32 wqe_lkey; 13762306a36Sopenharmony_ci __be32 params1; 13862306a36Sopenharmony_ci __be32 reserved2; 13962306a36Sopenharmony_ci __be32 next_send_psn; 14062306a36Sopenharmony_ci __be32 cqn_snd; 14162306a36Sopenharmony_ci __be32 snd_wqe_base_l; /* Next send WQE on Tavor */ 14262306a36Sopenharmony_ci __be32 snd_db_index; /* (debugging only entries) */ 14362306a36Sopenharmony_ci __be32 last_acked_psn; 14462306a36Sopenharmony_ci __be32 ssn; 14562306a36Sopenharmony_ci __be32 params2; 14662306a36Sopenharmony_ci __be32 rnr_nextrecvpsn; 14762306a36Sopenharmony_ci __be32 ra_buff_indx; 14862306a36Sopenharmony_ci __be32 cqn_rcv; 14962306a36Sopenharmony_ci __be32 rcv_wqe_base_l; /* Next recv WQE on Tavor */ 15062306a36Sopenharmony_ci __be32 rcv_db_index; /* (debugging only entries) */ 15162306a36Sopenharmony_ci __be32 qkey; 15262306a36Sopenharmony_ci __be32 srqn; 15362306a36Sopenharmony_ci __be32 rmsn; 15462306a36Sopenharmony_ci __be16 rq_wqe_counter; /* reserved on Tavor */ 15562306a36Sopenharmony_ci __be16 sq_wqe_counter; /* reserved on Tavor */ 15662306a36Sopenharmony_ci u32 reserved3[18]; 15762306a36Sopenharmony_ci} __packed; 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_cistruct mthca_qp_param { 16062306a36Sopenharmony_ci __be32 opt_param_mask; 16162306a36Sopenharmony_ci u32 reserved1; 16262306a36Sopenharmony_ci struct mthca_qp_context context; 16362306a36Sopenharmony_ci u32 reserved2[62]; 16462306a36Sopenharmony_ci} __packed; 16562306a36Sopenharmony_ci 16662306a36Sopenharmony_cienum { 16762306a36Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_ADDR_PATH = 1 << 0, 16862306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RRE = 1 << 1, 16962306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RAE = 1 << 2, 17062306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RWE = 1 << 3, 17162306a36Sopenharmony_ci MTHCA_QP_OPTPAR_PKEY_INDEX = 1 << 4, 17262306a36Sopenharmony_ci MTHCA_QP_OPTPAR_Q_KEY = 1 << 5, 17362306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RNR_TIMEOUT = 1 << 6, 17462306a36Sopenharmony_ci MTHCA_QP_OPTPAR_PRIMARY_ADDR_PATH = 1 << 7, 17562306a36Sopenharmony_ci MTHCA_QP_OPTPAR_SRA_MAX = 1 << 8, 17662306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RRA_MAX = 1 << 9, 17762306a36Sopenharmony_ci MTHCA_QP_OPTPAR_PM_STATE = 1 << 10, 17862306a36Sopenharmony_ci MTHCA_QP_OPTPAR_PORT_NUM = 1 << 11, 17962306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RETRY_COUNT = 1 << 12, 18062306a36Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_RNR_RETRY = 1 << 13, 18162306a36Sopenharmony_ci MTHCA_QP_OPTPAR_ACK_TIMEOUT = 1 << 14, 18262306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RNR_RETRY = 1 << 15, 18362306a36Sopenharmony_ci MTHCA_QP_OPTPAR_SCHED_QUEUE = 1 << 16 18462306a36Sopenharmony_ci}; 18562306a36Sopenharmony_ci 18662306a36Sopenharmony_cistatic const u8 mthca_opcode[] = { 18762306a36Sopenharmony_ci [IB_WR_SEND] = MTHCA_OPCODE_SEND, 18862306a36Sopenharmony_ci [IB_WR_SEND_WITH_IMM] = MTHCA_OPCODE_SEND_IMM, 18962306a36Sopenharmony_ci [IB_WR_RDMA_WRITE] = MTHCA_OPCODE_RDMA_WRITE, 19062306a36Sopenharmony_ci [IB_WR_RDMA_WRITE_WITH_IMM] = MTHCA_OPCODE_RDMA_WRITE_IMM, 19162306a36Sopenharmony_ci [IB_WR_RDMA_READ] = MTHCA_OPCODE_RDMA_READ, 19262306a36Sopenharmony_ci [IB_WR_ATOMIC_CMP_AND_SWP] = MTHCA_OPCODE_ATOMIC_CS, 19362306a36Sopenharmony_ci [IB_WR_ATOMIC_FETCH_AND_ADD] = MTHCA_OPCODE_ATOMIC_FA, 19462306a36Sopenharmony_ci}; 19562306a36Sopenharmony_ci 19662306a36Sopenharmony_cistatic int is_sqp(struct mthca_dev *dev, struct mthca_qp *qp) 19762306a36Sopenharmony_ci{ 19862306a36Sopenharmony_ci return qp->qpn >= dev->qp_table.sqp_start && 19962306a36Sopenharmony_ci qp->qpn <= dev->qp_table.sqp_start + 3; 20062306a36Sopenharmony_ci} 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_cistatic int is_qp0(struct mthca_dev *dev, struct mthca_qp *qp) 20362306a36Sopenharmony_ci{ 20462306a36Sopenharmony_ci return qp->qpn >= dev->qp_table.sqp_start && 20562306a36Sopenharmony_ci qp->qpn <= dev->qp_table.sqp_start + 1; 20662306a36Sopenharmony_ci} 20762306a36Sopenharmony_ci 20862306a36Sopenharmony_cistatic void *get_recv_wqe(struct mthca_qp *qp, int n) 20962306a36Sopenharmony_ci{ 21062306a36Sopenharmony_ci if (qp->is_direct) 21162306a36Sopenharmony_ci return qp->queue.direct.buf + (n << qp->rq.wqe_shift); 21262306a36Sopenharmony_ci else 21362306a36Sopenharmony_ci return qp->queue.page_list[(n << qp->rq.wqe_shift) >> PAGE_SHIFT].buf + 21462306a36Sopenharmony_ci ((n << qp->rq.wqe_shift) & (PAGE_SIZE - 1)); 21562306a36Sopenharmony_ci} 21662306a36Sopenharmony_ci 21762306a36Sopenharmony_cistatic void *get_send_wqe(struct mthca_qp *qp, int n) 21862306a36Sopenharmony_ci{ 21962306a36Sopenharmony_ci if (qp->is_direct) 22062306a36Sopenharmony_ci return qp->queue.direct.buf + qp->send_wqe_offset + 22162306a36Sopenharmony_ci (n << qp->sq.wqe_shift); 22262306a36Sopenharmony_ci else 22362306a36Sopenharmony_ci return qp->queue.page_list[(qp->send_wqe_offset + 22462306a36Sopenharmony_ci (n << qp->sq.wqe_shift)) >> 22562306a36Sopenharmony_ci PAGE_SHIFT].buf + 22662306a36Sopenharmony_ci ((qp->send_wqe_offset + (n << qp->sq.wqe_shift)) & 22762306a36Sopenharmony_ci (PAGE_SIZE - 1)); 22862306a36Sopenharmony_ci} 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_cistatic void mthca_wq_reset(struct mthca_wq *wq) 23162306a36Sopenharmony_ci{ 23262306a36Sopenharmony_ci wq->next_ind = 0; 23362306a36Sopenharmony_ci wq->last_comp = wq->max - 1; 23462306a36Sopenharmony_ci wq->head = 0; 23562306a36Sopenharmony_ci wq->tail = 0; 23662306a36Sopenharmony_ci} 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_civoid mthca_qp_event(struct mthca_dev *dev, u32 qpn, 23962306a36Sopenharmony_ci enum ib_event_type event_type) 24062306a36Sopenharmony_ci{ 24162306a36Sopenharmony_ci struct mthca_qp *qp; 24262306a36Sopenharmony_ci struct ib_event event; 24362306a36Sopenharmony_ci 24462306a36Sopenharmony_ci spin_lock(&dev->qp_table.lock); 24562306a36Sopenharmony_ci qp = mthca_array_get(&dev->qp_table.qp, qpn & (dev->limits.num_qps - 1)); 24662306a36Sopenharmony_ci if (qp) 24762306a36Sopenharmony_ci ++qp->refcount; 24862306a36Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_ci if (!qp) { 25162306a36Sopenharmony_ci mthca_warn(dev, "Async event %d for bogus QP %08x\n", 25262306a36Sopenharmony_ci event_type, qpn); 25362306a36Sopenharmony_ci return; 25462306a36Sopenharmony_ci } 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci if (event_type == IB_EVENT_PATH_MIG) 25762306a36Sopenharmony_ci qp->port = qp->alt_port; 25862306a36Sopenharmony_ci 25962306a36Sopenharmony_ci event.device = &dev->ib_dev; 26062306a36Sopenharmony_ci event.event = event_type; 26162306a36Sopenharmony_ci event.element.qp = &qp->ibqp; 26262306a36Sopenharmony_ci if (qp->ibqp.event_handler) 26362306a36Sopenharmony_ci qp->ibqp.event_handler(&event, qp->ibqp.qp_context); 26462306a36Sopenharmony_ci 26562306a36Sopenharmony_ci spin_lock(&dev->qp_table.lock); 26662306a36Sopenharmony_ci if (!--qp->refcount) 26762306a36Sopenharmony_ci wake_up(&qp->wait); 26862306a36Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 26962306a36Sopenharmony_ci} 27062306a36Sopenharmony_ci 27162306a36Sopenharmony_cistatic int to_mthca_state(enum ib_qp_state ib_state) 27262306a36Sopenharmony_ci{ 27362306a36Sopenharmony_ci switch (ib_state) { 27462306a36Sopenharmony_ci case IB_QPS_RESET: return MTHCA_QP_STATE_RST; 27562306a36Sopenharmony_ci case IB_QPS_INIT: return MTHCA_QP_STATE_INIT; 27662306a36Sopenharmony_ci case IB_QPS_RTR: return MTHCA_QP_STATE_RTR; 27762306a36Sopenharmony_ci case IB_QPS_RTS: return MTHCA_QP_STATE_RTS; 27862306a36Sopenharmony_ci case IB_QPS_SQD: return MTHCA_QP_STATE_SQD; 27962306a36Sopenharmony_ci case IB_QPS_SQE: return MTHCA_QP_STATE_SQE; 28062306a36Sopenharmony_ci case IB_QPS_ERR: return MTHCA_QP_STATE_ERR; 28162306a36Sopenharmony_ci default: return -1; 28262306a36Sopenharmony_ci } 28362306a36Sopenharmony_ci} 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_cienum { RC, UC, UD, RD, RDEE, MLX, NUM_TRANS }; 28662306a36Sopenharmony_ci 28762306a36Sopenharmony_cistatic int to_mthca_st(int transport) 28862306a36Sopenharmony_ci{ 28962306a36Sopenharmony_ci switch (transport) { 29062306a36Sopenharmony_ci case RC: return MTHCA_QP_ST_RC; 29162306a36Sopenharmony_ci case UC: return MTHCA_QP_ST_UC; 29262306a36Sopenharmony_ci case UD: return MTHCA_QP_ST_UD; 29362306a36Sopenharmony_ci case RD: return MTHCA_QP_ST_RD; 29462306a36Sopenharmony_ci case MLX: return MTHCA_QP_ST_MLX; 29562306a36Sopenharmony_ci default: return -1; 29662306a36Sopenharmony_ci } 29762306a36Sopenharmony_ci} 29862306a36Sopenharmony_ci 29962306a36Sopenharmony_cistatic void store_attrs(struct mthca_sqp *sqp, const struct ib_qp_attr *attr, 30062306a36Sopenharmony_ci int attr_mask) 30162306a36Sopenharmony_ci{ 30262306a36Sopenharmony_ci if (attr_mask & IB_QP_PKEY_INDEX) 30362306a36Sopenharmony_ci sqp->pkey_index = attr->pkey_index; 30462306a36Sopenharmony_ci if (attr_mask & IB_QP_QKEY) 30562306a36Sopenharmony_ci sqp->qkey = attr->qkey; 30662306a36Sopenharmony_ci if (attr_mask & IB_QP_SQ_PSN) 30762306a36Sopenharmony_ci sqp->send_psn = attr->sq_psn; 30862306a36Sopenharmony_ci} 30962306a36Sopenharmony_ci 31062306a36Sopenharmony_cistatic void init_port(struct mthca_dev *dev, int port) 31162306a36Sopenharmony_ci{ 31262306a36Sopenharmony_ci int err; 31362306a36Sopenharmony_ci struct mthca_init_ib_param param; 31462306a36Sopenharmony_ci 31562306a36Sopenharmony_ci memset(¶m, 0, sizeof param); 31662306a36Sopenharmony_ci 31762306a36Sopenharmony_ci param.port_width = dev->limits.port_width_cap; 31862306a36Sopenharmony_ci param.vl_cap = dev->limits.vl_cap; 31962306a36Sopenharmony_ci param.mtu_cap = dev->limits.mtu_cap; 32062306a36Sopenharmony_ci param.gid_cap = dev->limits.gid_table_len; 32162306a36Sopenharmony_ci param.pkey_cap = dev->limits.pkey_table_len; 32262306a36Sopenharmony_ci 32362306a36Sopenharmony_ci err = mthca_INIT_IB(dev, ¶m, port); 32462306a36Sopenharmony_ci if (err) 32562306a36Sopenharmony_ci mthca_warn(dev, "INIT_IB failed, return code %d.\n", err); 32662306a36Sopenharmony_ci} 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_cistatic __be32 get_hw_access_flags(struct mthca_qp *qp, const struct ib_qp_attr *attr, 32962306a36Sopenharmony_ci int attr_mask) 33062306a36Sopenharmony_ci{ 33162306a36Sopenharmony_ci u8 dest_rd_atomic; 33262306a36Sopenharmony_ci u32 access_flags; 33362306a36Sopenharmony_ci u32 hw_access_flags = 0; 33462306a36Sopenharmony_ci 33562306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) 33662306a36Sopenharmony_ci dest_rd_atomic = attr->max_dest_rd_atomic; 33762306a36Sopenharmony_ci else 33862306a36Sopenharmony_ci dest_rd_atomic = qp->resp_depth; 33962306a36Sopenharmony_ci 34062306a36Sopenharmony_ci if (attr_mask & IB_QP_ACCESS_FLAGS) 34162306a36Sopenharmony_ci access_flags = attr->qp_access_flags; 34262306a36Sopenharmony_ci else 34362306a36Sopenharmony_ci access_flags = qp->atomic_rd_en; 34462306a36Sopenharmony_ci 34562306a36Sopenharmony_ci if (!dest_rd_atomic) 34662306a36Sopenharmony_ci access_flags &= IB_ACCESS_REMOTE_WRITE; 34762306a36Sopenharmony_ci 34862306a36Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_READ) 34962306a36Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RRE; 35062306a36Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_ATOMIC) 35162306a36Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RAE; 35262306a36Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_WRITE) 35362306a36Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RWE; 35462306a36Sopenharmony_ci 35562306a36Sopenharmony_ci return cpu_to_be32(hw_access_flags); 35662306a36Sopenharmony_ci} 35762306a36Sopenharmony_ci 35862306a36Sopenharmony_cistatic inline enum ib_qp_state to_ib_qp_state(int mthca_state) 35962306a36Sopenharmony_ci{ 36062306a36Sopenharmony_ci switch (mthca_state) { 36162306a36Sopenharmony_ci case MTHCA_QP_STATE_RST: return IB_QPS_RESET; 36262306a36Sopenharmony_ci case MTHCA_QP_STATE_INIT: return IB_QPS_INIT; 36362306a36Sopenharmony_ci case MTHCA_QP_STATE_RTR: return IB_QPS_RTR; 36462306a36Sopenharmony_ci case MTHCA_QP_STATE_RTS: return IB_QPS_RTS; 36562306a36Sopenharmony_ci case MTHCA_QP_STATE_DRAINING: 36662306a36Sopenharmony_ci case MTHCA_QP_STATE_SQD: return IB_QPS_SQD; 36762306a36Sopenharmony_ci case MTHCA_QP_STATE_SQE: return IB_QPS_SQE; 36862306a36Sopenharmony_ci case MTHCA_QP_STATE_ERR: return IB_QPS_ERR; 36962306a36Sopenharmony_ci default: return -1; 37062306a36Sopenharmony_ci } 37162306a36Sopenharmony_ci} 37262306a36Sopenharmony_ci 37362306a36Sopenharmony_cistatic inline enum ib_mig_state to_ib_mig_state(int mthca_mig_state) 37462306a36Sopenharmony_ci{ 37562306a36Sopenharmony_ci switch (mthca_mig_state) { 37662306a36Sopenharmony_ci case 0: return IB_MIG_ARMED; 37762306a36Sopenharmony_ci case 1: return IB_MIG_REARM; 37862306a36Sopenharmony_ci case 3: return IB_MIG_MIGRATED; 37962306a36Sopenharmony_ci default: return -1; 38062306a36Sopenharmony_ci } 38162306a36Sopenharmony_ci} 38262306a36Sopenharmony_ci 38362306a36Sopenharmony_cistatic int to_ib_qp_access_flags(int mthca_flags) 38462306a36Sopenharmony_ci{ 38562306a36Sopenharmony_ci int ib_flags = 0; 38662306a36Sopenharmony_ci 38762306a36Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RRE) 38862306a36Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_READ; 38962306a36Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RWE) 39062306a36Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_WRITE; 39162306a36Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RAE) 39262306a36Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_ATOMIC; 39362306a36Sopenharmony_ci 39462306a36Sopenharmony_ci return ib_flags; 39562306a36Sopenharmony_ci} 39662306a36Sopenharmony_ci 39762306a36Sopenharmony_cistatic void to_rdma_ah_attr(struct mthca_dev *dev, 39862306a36Sopenharmony_ci struct rdma_ah_attr *ah_attr, 39962306a36Sopenharmony_ci struct mthca_qp_path *path) 40062306a36Sopenharmony_ci{ 40162306a36Sopenharmony_ci u8 port_num = (be32_to_cpu(path->port_pkey) >> 24) & 0x3; 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci memset(ah_attr, 0, sizeof(*ah_attr)); 40462306a36Sopenharmony_ci 40562306a36Sopenharmony_ci if (port_num == 0 || port_num > dev->limits.num_ports) 40662306a36Sopenharmony_ci return; 40762306a36Sopenharmony_ci ah_attr->type = rdma_ah_find_type(&dev->ib_dev, port_num); 40862306a36Sopenharmony_ci rdma_ah_set_port_num(ah_attr, port_num); 40962306a36Sopenharmony_ci 41062306a36Sopenharmony_ci rdma_ah_set_dlid(ah_attr, be16_to_cpu(path->rlid)); 41162306a36Sopenharmony_ci rdma_ah_set_sl(ah_attr, be32_to_cpu(path->sl_tclass_flowlabel) >> 28); 41262306a36Sopenharmony_ci rdma_ah_set_path_bits(ah_attr, path->g_mylmc & 0x7f); 41362306a36Sopenharmony_ci rdma_ah_set_static_rate(ah_attr, 41462306a36Sopenharmony_ci mthca_rate_to_ib(dev, 41562306a36Sopenharmony_ci path->static_rate & 0xf, 41662306a36Sopenharmony_ci port_num)); 41762306a36Sopenharmony_ci if (path->g_mylmc & (1 << 7)) { 41862306a36Sopenharmony_ci u32 tc_fl = be32_to_cpu(path->sl_tclass_flowlabel); 41962306a36Sopenharmony_ci 42062306a36Sopenharmony_ci rdma_ah_set_grh(ah_attr, NULL, 42162306a36Sopenharmony_ci tc_fl & 0xfffff, 42262306a36Sopenharmony_ci path->mgid_index & 42362306a36Sopenharmony_ci (dev->limits.gid_table_len - 1), 42462306a36Sopenharmony_ci path->hop_limit, 42562306a36Sopenharmony_ci (tc_fl >> 20) & 0xff); 42662306a36Sopenharmony_ci rdma_ah_set_dgid_raw(ah_attr, path->rgid); 42762306a36Sopenharmony_ci } 42862306a36Sopenharmony_ci} 42962306a36Sopenharmony_ci 43062306a36Sopenharmony_ciint mthca_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr, int qp_attr_mask, 43162306a36Sopenharmony_ci struct ib_qp_init_attr *qp_init_attr) 43262306a36Sopenharmony_ci{ 43362306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 43462306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 43562306a36Sopenharmony_ci int err = 0; 43662306a36Sopenharmony_ci struct mthca_mailbox *mailbox = NULL; 43762306a36Sopenharmony_ci struct mthca_qp_param *qp_param; 43862306a36Sopenharmony_ci struct mthca_qp_context *context; 43962306a36Sopenharmony_ci int mthca_state; 44062306a36Sopenharmony_ci 44162306a36Sopenharmony_ci mutex_lock(&qp->mutex); 44262306a36Sopenharmony_ci 44362306a36Sopenharmony_ci if (qp->state == IB_QPS_RESET) { 44462306a36Sopenharmony_ci qp_attr->qp_state = IB_QPS_RESET; 44562306a36Sopenharmony_ci goto done; 44662306a36Sopenharmony_ci } 44762306a36Sopenharmony_ci 44862306a36Sopenharmony_ci mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); 44962306a36Sopenharmony_ci if (IS_ERR(mailbox)) { 45062306a36Sopenharmony_ci err = PTR_ERR(mailbox); 45162306a36Sopenharmony_ci goto out; 45262306a36Sopenharmony_ci } 45362306a36Sopenharmony_ci 45462306a36Sopenharmony_ci err = mthca_QUERY_QP(dev, qp->qpn, 0, mailbox); 45562306a36Sopenharmony_ci if (err) { 45662306a36Sopenharmony_ci mthca_warn(dev, "QUERY_QP failed (%d)\n", err); 45762306a36Sopenharmony_ci goto out_mailbox; 45862306a36Sopenharmony_ci } 45962306a36Sopenharmony_ci 46062306a36Sopenharmony_ci qp_param = mailbox->buf; 46162306a36Sopenharmony_ci context = &qp_param->context; 46262306a36Sopenharmony_ci mthca_state = be32_to_cpu(context->flags) >> 28; 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_ci qp->state = to_ib_qp_state(mthca_state); 46562306a36Sopenharmony_ci qp_attr->qp_state = qp->state; 46662306a36Sopenharmony_ci qp_attr->path_mtu = context->mtu_msgmax >> 5; 46762306a36Sopenharmony_ci qp_attr->path_mig_state = 46862306a36Sopenharmony_ci to_ib_mig_state((be32_to_cpu(context->flags) >> 11) & 0x3); 46962306a36Sopenharmony_ci qp_attr->qkey = be32_to_cpu(context->qkey); 47062306a36Sopenharmony_ci qp_attr->rq_psn = be32_to_cpu(context->rnr_nextrecvpsn) & 0xffffff; 47162306a36Sopenharmony_ci qp_attr->sq_psn = be32_to_cpu(context->next_send_psn) & 0xffffff; 47262306a36Sopenharmony_ci qp_attr->dest_qp_num = be32_to_cpu(context->remote_qpn) & 0xffffff; 47362306a36Sopenharmony_ci qp_attr->qp_access_flags = 47462306a36Sopenharmony_ci to_ib_qp_access_flags(be32_to_cpu(context->params2)); 47562306a36Sopenharmony_ci 47662306a36Sopenharmony_ci if (qp->transport == RC || qp->transport == UC) { 47762306a36Sopenharmony_ci to_rdma_ah_attr(dev, &qp_attr->ah_attr, &context->pri_path); 47862306a36Sopenharmony_ci to_rdma_ah_attr(dev, &qp_attr->alt_ah_attr, &context->alt_path); 47962306a36Sopenharmony_ci qp_attr->alt_pkey_index = 48062306a36Sopenharmony_ci be32_to_cpu(context->alt_path.port_pkey) & 0x7f; 48162306a36Sopenharmony_ci qp_attr->alt_port_num = 48262306a36Sopenharmony_ci rdma_ah_get_port_num(&qp_attr->alt_ah_attr); 48362306a36Sopenharmony_ci } 48462306a36Sopenharmony_ci 48562306a36Sopenharmony_ci qp_attr->pkey_index = be32_to_cpu(context->pri_path.port_pkey) & 0x7f; 48662306a36Sopenharmony_ci qp_attr->port_num = 48762306a36Sopenharmony_ci (be32_to_cpu(context->pri_path.port_pkey) >> 24) & 0x3; 48862306a36Sopenharmony_ci 48962306a36Sopenharmony_ci /* qp_attr->en_sqd_async_notify is only applicable in modify qp */ 49062306a36Sopenharmony_ci qp_attr->sq_draining = mthca_state == MTHCA_QP_STATE_DRAINING; 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci qp_attr->max_rd_atomic = 1 << ((be32_to_cpu(context->params1) >> 21) & 0x7); 49362306a36Sopenharmony_ci 49462306a36Sopenharmony_ci qp_attr->max_dest_rd_atomic = 49562306a36Sopenharmony_ci 1 << ((be32_to_cpu(context->params2) >> 21) & 0x7); 49662306a36Sopenharmony_ci qp_attr->min_rnr_timer = 49762306a36Sopenharmony_ci (be32_to_cpu(context->rnr_nextrecvpsn) >> 24) & 0x1f; 49862306a36Sopenharmony_ci qp_attr->timeout = context->pri_path.ackto >> 3; 49962306a36Sopenharmony_ci qp_attr->retry_cnt = (be32_to_cpu(context->params1) >> 16) & 0x7; 50062306a36Sopenharmony_ci qp_attr->rnr_retry = context->pri_path.rnr_retry >> 5; 50162306a36Sopenharmony_ci qp_attr->alt_timeout = context->alt_path.ackto >> 3; 50262306a36Sopenharmony_ci 50362306a36Sopenharmony_cidone: 50462306a36Sopenharmony_ci qp_attr->cur_qp_state = qp_attr->qp_state; 50562306a36Sopenharmony_ci qp_attr->cap.max_send_wr = qp->sq.max; 50662306a36Sopenharmony_ci qp_attr->cap.max_recv_wr = qp->rq.max; 50762306a36Sopenharmony_ci qp_attr->cap.max_send_sge = qp->sq.max_gs; 50862306a36Sopenharmony_ci qp_attr->cap.max_recv_sge = qp->rq.max_gs; 50962306a36Sopenharmony_ci qp_attr->cap.max_inline_data = qp->max_inline_data; 51062306a36Sopenharmony_ci 51162306a36Sopenharmony_ci qp_init_attr->cap = qp_attr->cap; 51262306a36Sopenharmony_ci qp_init_attr->sq_sig_type = qp->sq_policy; 51362306a36Sopenharmony_ci 51462306a36Sopenharmony_ciout_mailbox: 51562306a36Sopenharmony_ci mthca_free_mailbox(dev, mailbox); 51662306a36Sopenharmony_ci 51762306a36Sopenharmony_ciout: 51862306a36Sopenharmony_ci mutex_unlock(&qp->mutex); 51962306a36Sopenharmony_ci return err; 52062306a36Sopenharmony_ci} 52162306a36Sopenharmony_ci 52262306a36Sopenharmony_cistatic int mthca_path_set(struct mthca_dev *dev, const struct rdma_ah_attr *ah, 52362306a36Sopenharmony_ci struct mthca_qp_path *path, u8 port) 52462306a36Sopenharmony_ci{ 52562306a36Sopenharmony_ci path->g_mylmc = rdma_ah_get_path_bits(ah) & 0x7f; 52662306a36Sopenharmony_ci path->rlid = cpu_to_be16(rdma_ah_get_dlid(ah)); 52762306a36Sopenharmony_ci path->static_rate = mthca_get_rate(dev, rdma_ah_get_static_rate(ah), 52862306a36Sopenharmony_ci port); 52962306a36Sopenharmony_ci 53062306a36Sopenharmony_ci if (rdma_ah_get_ah_flags(ah) & IB_AH_GRH) { 53162306a36Sopenharmony_ci const struct ib_global_route *grh = rdma_ah_read_grh(ah); 53262306a36Sopenharmony_ci 53362306a36Sopenharmony_ci if (grh->sgid_index >= dev->limits.gid_table_len) { 53462306a36Sopenharmony_ci mthca_dbg(dev, "sgid_index (%u) too large. max is %d\n", 53562306a36Sopenharmony_ci grh->sgid_index, 53662306a36Sopenharmony_ci dev->limits.gid_table_len - 1); 53762306a36Sopenharmony_ci return -1; 53862306a36Sopenharmony_ci } 53962306a36Sopenharmony_ci 54062306a36Sopenharmony_ci path->g_mylmc |= 1 << 7; 54162306a36Sopenharmony_ci path->mgid_index = grh->sgid_index; 54262306a36Sopenharmony_ci path->hop_limit = grh->hop_limit; 54362306a36Sopenharmony_ci path->sl_tclass_flowlabel = 54462306a36Sopenharmony_ci cpu_to_be32((rdma_ah_get_sl(ah) << 28) | 54562306a36Sopenharmony_ci (grh->traffic_class << 20) | 54662306a36Sopenharmony_ci (grh->flow_label)); 54762306a36Sopenharmony_ci memcpy(path->rgid, grh->dgid.raw, 16); 54862306a36Sopenharmony_ci } else { 54962306a36Sopenharmony_ci path->sl_tclass_flowlabel = cpu_to_be32(rdma_ah_get_sl(ah) << 55062306a36Sopenharmony_ci 28); 55162306a36Sopenharmony_ci } 55262306a36Sopenharmony_ci 55362306a36Sopenharmony_ci return 0; 55462306a36Sopenharmony_ci} 55562306a36Sopenharmony_ci 55662306a36Sopenharmony_cistatic int __mthca_modify_qp(struct ib_qp *ibqp, 55762306a36Sopenharmony_ci const struct ib_qp_attr *attr, int attr_mask, 55862306a36Sopenharmony_ci enum ib_qp_state cur_state, 55962306a36Sopenharmony_ci enum ib_qp_state new_state, 56062306a36Sopenharmony_ci struct ib_udata *udata) 56162306a36Sopenharmony_ci{ 56262306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 56362306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 56462306a36Sopenharmony_ci struct mthca_ucontext *context = rdma_udata_to_drv_context( 56562306a36Sopenharmony_ci udata, struct mthca_ucontext, ibucontext); 56662306a36Sopenharmony_ci struct mthca_mailbox *mailbox; 56762306a36Sopenharmony_ci struct mthca_qp_param *qp_param; 56862306a36Sopenharmony_ci struct mthca_qp_context *qp_context; 56962306a36Sopenharmony_ci u32 sqd_event = 0; 57062306a36Sopenharmony_ci int err = -EINVAL; 57162306a36Sopenharmony_ci 57262306a36Sopenharmony_ci mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); 57362306a36Sopenharmony_ci if (IS_ERR(mailbox)) { 57462306a36Sopenharmony_ci err = PTR_ERR(mailbox); 57562306a36Sopenharmony_ci goto out; 57662306a36Sopenharmony_ci } 57762306a36Sopenharmony_ci qp_param = mailbox->buf; 57862306a36Sopenharmony_ci qp_context = &qp_param->context; 57962306a36Sopenharmony_ci memset(qp_param, 0, sizeof *qp_param); 58062306a36Sopenharmony_ci 58162306a36Sopenharmony_ci qp_context->flags = cpu_to_be32((to_mthca_state(new_state) << 28) | 58262306a36Sopenharmony_ci (to_mthca_st(qp->transport) << 16)); 58362306a36Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_BIT_DE); 58462306a36Sopenharmony_ci if (!(attr_mask & IB_QP_PATH_MIG_STATE)) 58562306a36Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_MIGRATED << 11); 58662306a36Sopenharmony_ci else { 58762306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PM_STATE); 58862306a36Sopenharmony_ci switch (attr->path_mig_state) { 58962306a36Sopenharmony_ci case IB_MIG_MIGRATED: 59062306a36Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_MIGRATED << 11); 59162306a36Sopenharmony_ci break; 59262306a36Sopenharmony_ci case IB_MIG_REARM: 59362306a36Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_REARM << 11); 59462306a36Sopenharmony_ci break; 59562306a36Sopenharmony_ci case IB_MIG_ARMED: 59662306a36Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_ARMED << 11); 59762306a36Sopenharmony_ci break; 59862306a36Sopenharmony_ci } 59962306a36Sopenharmony_ci } 60062306a36Sopenharmony_ci 60162306a36Sopenharmony_ci /* leave tavor_sched_queue as 0 */ 60262306a36Sopenharmony_ci 60362306a36Sopenharmony_ci if (qp->transport == MLX || qp->transport == UD) 60462306a36Sopenharmony_ci qp_context->mtu_msgmax = (IB_MTU_2048 << 5) | 11; 60562306a36Sopenharmony_ci else if (attr_mask & IB_QP_PATH_MTU) { 60662306a36Sopenharmony_ci if (attr->path_mtu < IB_MTU_256 || attr->path_mtu > IB_MTU_2048) { 60762306a36Sopenharmony_ci mthca_dbg(dev, "path MTU (%u) is invalid\n", 60862306a36Sopenharmony_ci attr->path_mtu); 60962306a36Sopenharmony_ci goto out_mailbox; 61062306a36Sopenharmony_ci } 61162306a36Sopenharmony_ci qp_context->mtu_msgmax = (attr->path_mtu << 5) | 31; 61262306a36Sopenharmony_ci } 61362306a36Sopenharmony_ci 61462306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 61562306a36Sopenharmony_ci if (qp->rq.max) 61662306a36Sopenharmony_ci qp_context->rq_size_stride = ilog2(qp->rq.max) << 3; 61762306a36Sopenharmony_ci qp_context->rq_size_stride |= qp->rq.wqe_shift - 4; 61862306a36Sopenharmony_ci 61962306a36Sopenharmony_ci if (qp->sq.max) 62062306a36Sopenharmony_ci qp_context->sq_size_stride = ilog2(qp->sq.max) << 3; 62162306a36Sopenharmony_ci qp_context->sq_size_stride |= qp->sq.wqe_shift - 4; 62262306a36Sopenharmony_ci } 62362306a36Sopenharmony_ci 62462306a36Sopenharmony_ci /* leave arbel_sched_queue as 0 */ 62562306a36Sopenharmony_ci 62662306a36Sopenharmony_ci if (qp->ibqp.uobject) 62762306a36Sopenharmony_ci qp_context->usr_page = cpu_to_be32(context->uar.index); 62862306a36Sopenharmony_ci else 62962306a36Sopenharmony_ci qp_context->usr_page = cpu_to_be32(dev->driver_uar.index); 63062306a36Sopenharmony_ci qp_context->local_qpn = cpu_to_be32(qp->qpn); 63162306a36Sopenharmony_ci if (attr_mask & IB_QP_DEST_QPN) { 63262306a36Sopenharmony_ci qp_context->remote_qpn = cpu_to_be32(attr->dest_qp_num); 63362306a36Sopenharmony_ci } 63462306a36Sopenharmony_ci 63562306a36Sopenharmony_ci if (qp->transport == MLX) 63662306a36Sopenharmony_ci qp_context->pri_path.port_pkey |= 63762306a36Sopenharmony_ci cpu_to_be32(qp->port << 24); 63862306a36Sopenharmony_ci else { 63962306a36Sopenharmony_ci if (attr_mask & IB_QP_PORT) { 64062306a36Sopenharmony_ci qp_context->pri_path.port_pkey |= 64162306a36Sopenharmony_ci cpu_to_be32(attr->port_num << 24); 64262306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PORT_NUM); 64362306a36Sopenharmony_ci } 64462306a36Sopenharmony_ci } 64562306a36Sopenharmony_ci 64662306a36Sopenharmony_ci if (attr_mask & IB_QP_PKEY_INDEX) { 64762306a36Sopenharmony_ci qp_context->pri_path.port_pkey |= 64862306a36Sopenharmony_ci cpu_to_be32(attr->pkey_index); 64962306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PKEY_INDEX); 65062306a36Sopenharmony_ci } 65162306a36Sopenharmony_ci 65262306a36Sopenharmony_ci if (attr_mask & IB_QP_RNR_RETRY) { 65362306a36Sopenharmony_ci qp_context->alt_path.rnr_retry = qp_context->pri_path.rnr_retry = 65462306a36Sopenharmony_ci attr->rnr_retry << 5; 65562306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RNR_RETRY | 65662306a36Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_RNR_RETRY); 65762306a36Sopenharmony_ci } 65862306a36Sopenharmony_ci 65962306a36Sopenharmony_ci if (attr_mask & IB_QP_AV) { 66062306a36Sopenharmony_ci if (mthca_path_set(dev, &attr->ah_attr, &qp_context->pri_path, 66162306a36Sopenharmony_ci attr_mask & IB_QP_PORT ? attr->port_num : qp->port)) 66262306a36Sopenharmony_ci goto out_mailbox; 66362306a36Sopenharmony_ci 66462306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PRIMARY_ADDR_PATH); 66562306a36Sopenharmony_ci } 66662306a36Sopenharmony_ci 66762306a36Sopenharmony_ci if (ibqp->qp_type == IB_QPT_RC && 66862306a36Sopenharmony_ci cur_state == IB_QPS_INIT && new_state == IB_QPS_RTR) { 66962306a36Sopenharmony_ci u8 sched_queue = ibqp->uobject ? 0x2 : 0x1; 67062306a36Sopenharmony_ci 67162306a36Sopenharmony_ci if (mthca_is_memfree(dev)) 67262306a36Sopenharmony_ci qp_context->rlkey_arbel_sched_queue |= sched_queue; 67362306a36Sopenharmony_ci else 67462306a36Sopenharmony_ci qp_context->tavor_sched_queue |= cpu_to_be32(sched_queue); 67562306a36Sopenharmony_ci 67662306a36Sopenharmony_ci qp_param->opt_param_mask |= 67762306a36Sopenharmony_ci cpu_to_be32(MTHCA_QP_OPTPAR_SCHED_QUEUE); 67862306a36Sopenharmony_ci } 67962306a36Sopenharmony_ci 68062306a36Sopenharmony_ci if (attr_mask & IB_QP_TIMEOUT) { 68162306a36Sopenharmony_ci qp_context->pri_path.ackto = attr->timeout << 3; 68262306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_ACK_TIMEOUT); 68362306a36Sopenharmony_ci } 68462306a36Sopenharmony_ci 68562306a36Sopenharmony_ci if (attr_mask & IB_QP_ALT_PATH) { 68662306a36Sopenharmony_ci if (attr->alt_pkey_index >= dev->limits.pkey_table_len) { 68762306a36Sopenharmony_ci mthca_dbg(dev, "Alternate P_Key index (%u) too large. max is %d\n", 68862306a36Sopenharmony_ci attr->alt_pkey_index, dev->limits.pkey_table_len-1); 68962306a36Sopenharmony_ci goto out_mailbox; 69062306a36Sopenharmony_ci } 69162306a36Sopenharmony_ci 69262306a36Sopenharmony_ci if (attr->alt_port_num == 0 || attr->alt_port_num > dev->limits.num_ports) { 69362306a36Sopenharmony_ci mthca_dbg(dev, "Alternate port number (%u) is invalid\n", 69462306a36Sopenharmony_ci attr->alt_port_num); 69562306a36Sopenharmony_ci goto out_mailbox; 69662306a36Sopenharmony_ci } 69762306a36Sopenharmony_ci 69862306a36Sopenharmony_ci if (mthca_path_set(dev, &attr->alt_ah_attr, &qp_context->alt_path, 69962306a36Sopenharmony_ci rdma_ah_get_port_num(&attr->alt_ah_attr))) 70062306a36Sopenharmony_ci goto out_mailbox; 70162306a36Sopenharmony_ci 70262306a36Sopenharmony_ci qp_context->alt_path.port_pkey |= cpu_to_be32(attr->alt_pkey_index | 70362306a36Sopenharmony_ci attr->alt_port_num << 24); 70462306a36Sopenharmony_ci qp_context->alt_path.ackto = attr->alt_timeout << 3; 70562306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_ALT_ADDR_PATH); 70662306a36Sopenharmony_ci } 70762306a36Sopenharmony_ci 70862306a36Sopenharmony_ci /* leave rdd as 0 */ 70962306a36Sopenharmony_ci qp_context->pd = cpu_to_be32(to_mpd(ibqp->pd)->pd_num); 71062306a36Sopenharmony_ci /* leave wqe_base as 0 (we always create an MR based at 0 for WQs) */ 71162306a36Sopenharmony_ci qp_context->wqe_lkey = cpu_to_be32(qp->mr.ibmr.lkey); 71262306a36Sopenharmony_ci qp_context->params1 = cpu_to_be32((MTHCA_ACK_REQ_FREQ << 28) | 71362306a36Sopenharmony_ci (MTHCA_FLIGHT_LIMIT << 24) | 71462306a36Sopenharmony_ci MTHCA_QP_BIT_SWE); 71562306a36Sopenharmony_ci if (qp->sq_policy == IB_SIGNAL_ALL_WR) 71662306a36Sopenharmony_ci qp_context->params1 |= cpu_to_be32(MTHCA_QP_BIT_SSC); 71762306a36Sopenharmony_ci if (attr_mask & IB_QP_RETRY_CNT) { 71862306a36Sopenharmony_ci qp_context->params1 |= cpu_to_be32(attr->retry_cnt << 16); 71962306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RETRY_COUNT); 72062306a36Sopenharmony_ci } 72162306a36Sopenharmony_ci 72262306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC) { 72362306a36Sopenharmony_ci if (attr->max_rd_atomic) { 72462306a36Sopenharmony_ci qp_context->params1 |= 72562306a36Sopenharmony_ci cpu_to_be32(MTHCA_QP_BIT_SRE | 72662306a36Sopenharmony_ci MTHCA_QP_BIT_SAE); 72762306a36Sopenharmony_ci qp_context->params1 |= 72862306a36Sopenharmony_ci cpu_to_be32(fls(attr->max_rd_atomic - 1) << 21); 72962306a36Sopenharmony_ci } 73062306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_SRA_MAX); 73162306a36Sopenharmony_ci } 73262306a36Sopenharmony_ci 73362306a36Sopenharmony_ci if (attr_mask & IB_QP_SQ_PSN) 73462306a36Sopenharmony_ci qp_context->next_send_psn = cpu_to_be32(attr->sq_psn); 73562306a36Sopenharmony_ci qp_context->cqn_snd = cpu_to_be32(to_mcq(ibqp->send_cq)->cqn); 73662306a36Sopenharmony_ci 73762306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 73862306a36Sopenharmony_ci qp_context->snd_wqe_base_l = cpu_to_be32(qp->send_wqe_offset); 73962306a36Sopenharmony_ci qp_context->snd_db_index = cpu_to_be32(qp->sq.db_index); 74062306a36Sopenharmony_ci } 74162306a36Sopenharmony_ci 74262306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) { 74362306a36Sopenharmony_ci if (attr->max_dest_rd_atomic) 74462306a36Sopenharmony_ci qp_context->params2 |= 74562306a36Sopenharmony_ci cpu_to_be32(fls(attr->max_dest_rd_atomic - 1) << 21); 74662306a36Sopenharmony_ci 74762306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RRA_MAX); 74862306a36Sopenharmony_ci } 74962306a36Sopenharmony_ci 75062306a36Sopenharmony_ci if (attr_mask & (IB_QP_ACCESS_FLAGS | IB_QP_MAX_DEST_RD_ATOMIC)) { 75162306a36Sopenharmony_ci qp_context->params2 |= get_hw_access_flags(qp, attr, attr_mask); 75262306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RWE | 75362306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RRE | 75462306a36Sopenharmony_ci MTHCA_QP_OPTPAR_RAE); 75562306a36Sopenharmony_ci } 75662306a36Sopenharmony_ci 75762306a36Sopenharmony_ci qp_context->params2 |= cpu_to_be32(MTHCA_QP_BIT_RSC); 75862306a36Sopenharmony_ci 75962306a36Sopenharmony_ci if (ibqp->srq) 76062306a36Sopenharmony_ci qp_context->params2 |= cpu_to_be32(MTHCA_QP_BIT_RIC); 76162306a36Sopenharmony_ci 76262306a36Sopenharmony_ci if (attr_mask & IB_QP_MIN_RNR_TIMER) { 76362306a36Sopenharmony_ci qp_context->rnr_nextrecvpsn |= cpu_to_be32(attr->min_rnr_timer << 24); 76462306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RNR_TIMEOUT); 76562306a36Sopenharmony_ci } 76662306a36Sopenharmony_ci if (attr_mask & IB_QP_RQ_PSN) 76762306a36Sopenharmony_ci qp_context->rnr_nextrecvpsn |= cpu_to_be32(attr->rq_psn); 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_ci qp_context->ra_buff_indx = 77062306a36Sopenharmony_ci cpu_to_be32(dev->qp_table.rdb_base + 77162306a36Sopenharmony_ci ((qp->qpn & (dev->limits.num_qps - 1)) * MTHCA_RDB_ENTRY_SIZE << 77262306a36Sopenharmony_ci dev->qp_table.rdb_shift)); 77362306a36Sopenharmony_ci 77462306a36Sopenharmony_ci qp_context->cqn_rcv = cpu_to_be32(to_mcq(ibqp->recv_cq)->cqn); 77562306a36Sopenharmony_ci 77662306a36Sopenharmony_ci if (mthca_is_memfree(dev)) 77762306a36Sopenharmony_ci qp_context->rcv_db_index = cpu_to_be32(qp->rq.db_index); 77862306a36Sopenharmony_ci 77962306a36Sopenharmony_ci if (attr_mask & IB_QP_QKEY) { 78062306a36Sopenharmony_ci qp_context->qkey = cpu_to_be32(attr->qkey); 78162306a36Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_Q_KEY); 78262306a36Sopenharmony_ci } 78362306a36Sopenharmony_ci 78462306a36Sopenharmony_ci if (ibqp->srq) 78562306a36Sopenharmony_ci qp_context->srqn = cpu_to_be32(1 << 24 | 78662306a36Sopenharmony_ci to_msrq(ibqp->srq)->srqn); 78762306a36Sopenharmony_ci 78862306a36Sopenharmony_ci if (cur_state == IB_QPS_RTS && new_state == IB_QPS_SQD && 78962306a36Sopenharmony_ci attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY && 79062306a36Sopenharmony_ci attr->en_sqd_async_notify) 79162306a36Sopenharmony_ci sqd_event = 1 << 31; 79262306a36Sopenharmony_ci 79362306a36Sopenharmony_ci err = mthca_MODIFY_QP(dev, cur_state, new_state, qp->qpn, 0, 79462306a36Sopenharmony_ci mailbox, sqd_event); 79562306a36Sopenharmony_ci if (err) { 79662306a36Sopenharmony_ci mthca_warn(dev, "modify QP %d->%d returned %d.\n", 79762306a36Sopenharmony_ci cur_state, new_state, err); 79862306a36Sopenharmony_ci goto out_mailbox; 79962306a36Sopenharmony_ci } 80062306a36Sopenharmony_ci 80162306a36Sopenharmony_ci qp->state = new_state; 80262306a36Sopenharmony_ci if (attr_mask & IB_QP_ACCESS_FLAGS) 80362306a36Sopenharmony_ci qp->atomic_rd_en = attr->qp_access_flags; 80462306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) 80562306a36Sopenharmony_ci qp->resp_depth = attr->max_dest_rd_atomic; 80662306a36Sopenharmony_ci if (attr_mask & IB_QP_PORT) 80762306a36Sopenharmony_ci qp->port = attr->port_num; 80862306a36Sopenharmony_ci if (attr_mask & IB_QP_ALT_PATH) 80962306a36Sopenharmony_ci qp->alt_port = attr->alt_port_num; 81062306a36Sopenharmony_ci 81162306a36Sopenharmony_ci if (is_sqp(dev, qp)) 81262306a36Sopenharmony_ci store_attrs(qp->sqp, attr, attr_mask); 81362306a36Sopenharmony_ci 81462306a36Sopenharmony_ci /* 81562306a36Sopenharmony_ci * If we moved QP0 to RTR, bring the IB link up; if we moved 81662306a36Sopenharmony_ci * QP0 to RESET or ERROR, bring the link back down. 81762306a36Sopenharmony_ci */ 81862306a36Sopenharmony_ci if (is_qp0(dev, qp)) { 81962306a36Sopenharmony_ci if (cur_state != IB_QPS_RTR && 82062306a36Sopenharmony_ci new_state == IB_QPS_RTR) 82162306a36Sopenharmony_ci init_port(dev, qp->port); 82262306a36Sopenharmony_ci 82362306a36Sopenharmony_ci if (cur_state != IB_QPS_RESET && 82462306a36Sopenharmony_ci cur_state != IB_QPS_ERR && 82562306a36Sopenharmony_ci (new_state == IB_QPS_RESET || 82662306a36Sopenharmony_ci new_state == IB_QPS_ERR)) 82762306a36Sopenharmony_ci mthca_CLOSE_IB(dev, qp->port); 82862306a36Sopenharmony_ci } 82962306a36Sopenharmony_ci 83062306a36Sopenharmony_ci /* 83162306a36Sopenharmony_ci * If we moved a kernel QP to RESET, clean up all old CQ 83262306a36Sopenharmony_ci * entries and reinitialize the QP. 83362306a36Sopenharmony_ci */ 83462306a36Sopenharmony_ci if (new_state == IB_QPS_RESET && !qp->ibqp.uobject) { 83562306a36Sopenharmony_ci mthca_cq_clean(dev, to_mcq(qp->ibqp.recv_cq), qp->qpn, 83662306a36Sopenharmony_ci qp->ibqp.srq ? to_msrq(qp->ibqp.srq) : NULL); 83762306a36Sopenharmony_ci if (qp->ibqp.send_cq != qp->ibqp.recv_cq) 83862306a36Sopenharmony_ci mthca_cq_clean(dev, to_mcq(qp->ibqp.send_cq), qp->qpn, NULL); 83962306a36Sopenharmony_ci 84062306a36Sopenharmony_ci mthca_wq_reset(&qp->sq); 84162306a36Sopenharmony_ci qp->sq.last = get_send_wqe(qp, qp->sq.max - 1); 84262306a36Sopenharmony_ci 84362306a36Sopenharmony_ci mthca_wq_reset(&qp->rq); 84462306a36Sopenharmony_ci qp->rq.last = get_recv_wqe(qp, qp->rq.max - 1); 84562306a36Sopenharmony_ci 84662306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 84762306a36Sopenharmony_ci *qp->sq.db = 0; 84862306a36Sopenharmony_ci *qp->rq.db = 0; 84962306a36Sopenharmony_ci } 85062306a36Sopenharmony_ci } 85162306a36Sopenharmony_ci 85262306a36Sopenharmony_ciout_mailbox: 85362306a36Sopenharmony_ci mthca_free_mailbox(dev, mailbox); 85462306a36Sopenharmony_ciout: 85562306a36Sopenharmony_ci return err; 85662306a36Sopenharmony_ci} 85762306a36Sopenharmony_ci 85862306a36Sopenharmony_ciint mthca_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr, int attr_mask, 85962306a36Sopenharmony_ci struct ib_udata *udata) 86062306a36Sopenharmony_ci{ 86162306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 86262306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 86362306a36Sopenharmony_ci enum ib_qp_state cur_state, new_state; 86462306a36Sopenharmony_ci int err = -EINVAL; 86562306a36Sopenharmony_ci 86662306a36Sopenharmony_ci if (attr_mask & ~IB_QP_ATTR_STANDARD_BITS) 86762306a36Sopenharmony_ci return -EOPNOTSUPP; 86862306a36Sopenharmony_ci 86962306a36Sopenharmony_ci mutex_lock(&qp->mutex); 87062306a36Sopenharmony_ci if (attr_mask & IB_QP_CUR_STATE) { 87162306a36Sopenharmony_ci cur_state = attr->cur_qp_state; 87262306a36Sopenharmony_ci } else { 87362306a36Sopenharmony_ci spin_lock_irq(&qp->sq.lock); 87462306a36Sopenharmony_ci spin_lock(&qp->rq.lock); 87562306a36Sopenharmony_ci cur_state = qp->state; 87662306a36Sopenharmony_ci spin_unlock(&qp->rq.lock); 87762306a36Sopenharmony_ci spin_unlock_irq(&qp->sq.lock); 87862306a36Sopenharmony_ci } 87962306a36Sopenharmony_ci 88062306a36Sopenharmony_ci new_state = attr_mask & IB_QP_STATE ? attr->qp_state : cur_state; 88162306a36Sopenharmony_ci 88262306a36Sopenharmony_ci if (!ib_modify_qp_is_ok(cur_state, new_state, ibqp->qp_type, 88362306a36Sopenharmony_ci attr_mask)) { 88462306a36Sopenharmony_ci mthca_dbg(dev, "Bad QP transition (transport %d) " 88562306a36Sopenharmony_ci "%d->%d with attr 0x%08x\n", 88662306a36Sopenharmony_ci qp->transport, cur_state, new_state, 88762306a36Sopenharmony_ci attr_mask); 88862306a36Sopenharmony_ci goto out; 88962306a36Sopenharmony_ci } 89062306a36Sopenharmony_ci 89162306a36Sopenharmony_ci if ((attr_mask & IB_QP_PKEY_INDEX) && 89262306a36Sopenharmony_ci attr->pkey_index >= dev->limits.pkey_table_len) { 89362306a36Sopenharmony_ci mthca_dbg(dev, "P_Key index (%u) too large. max is %d\n", 89462306a36Sopenharmony_ci attr->pkey_index, dev->limits.pkey_table_len-1); 89562306a36Sopenharmony_ci goto out; 89662306a36Sopenharmony_ci } 89762306a36Sopenharmony_ci 89862306a36Sopenharmony_ci if ((attr_mask & IB_QP_PORT) && 89962306a36Sopenharmony_ci (attr->port_num == 0 || attr->port_num > dev->limits.num_ports)) { 90062306a36Sopenharmony_ci mthca_dbg(dev, "Port number (%u) is invalid\n", attr->port_num); 90162306a36Sopenharmony_ci goto out; 90262306a36Sopenharmony_ci } 90362306a36Sopenharmony_ci 90462306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC && 90562306a36Sopenharmony_ci attr->max_rd_atomic > dev->limits.max_qp_init_rdma) { 90662306a36Sopenharmony_ci mthca_dbg(dev, "Max rdma_atomic as initiator %u too large (max is %d)\n", 90762306a36Sopenharmony_ci attr->max_rd_atomic, dev->limits.max_qp_init_rdma); 90862306a36Sopenharmony_ci goto out; 90962306a36Sopenharmony_ci } 91062306a36Sopenharmony_ci 91162306a36Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC && 91262306a36Sopenharmony_ci attr->max_dest_rd_atomic > 1 << dev->qp_table.rdb_shift) { 91362306a36Sopenharmony_ci mthca_dbg(dev, "Max rdma_atomic as responder %u too large (max %d)\n", 91462306a36Sopenharmony_ci attr->max_dest_rd_atomic, 1 << dev->qp_table.rdb_shift); 91562306a36Sopenharmony_ci goto out; 91662306a36Sopenharmony_ci } 91762306a36Sopenharmony_ci 91862306a36Sopenharmony_ci if (cur_state == new_state && cur_state == IB_QPS_RESET) { 91962306a36Sopenharmony_ci err = 0; 92062306a36Sopenharmony_ci goto out; 92162306a36Sopenharmony_ci } 92262306a36Sopenharmony_ci 92362306a36Sopenharmony_ci err = __mthca_modify_qp(ibqp, attr, attr_mask, cur_state, new_state, 92462306a36Sopenharmony_ci udata); 92562306a36Sopenharmony_ci 92662306a36Sopenharmony_ciout: 92762306a36Sopenharmony_ci mutex_unlock(&qp->mutex); 92862306a36Sopenharmony_ci return err; 92962306a36Sopenharmony_ci} 93062306a36Sopenharmony_ci 93162306a36Sopenharmony_cistatic int mthca_max_data_size(struct mthca_dev *dev, struct mthca_qp *qp, int desc_sz) 93262306a36Sopenharmony_ci{ 93362306a36Sopenharmony_ci /* 93462306a36Sopenharmony_ci * Calculate the maximum size of WQE s/g segments, excluding 93562306a36Sopenharmony_ci * the next segment and other non-data segments. 93662306a36Sopenharmony_ci */ 93762306a36Sopenharmony_ci int max_data_size = desc_sz - sizeof (struct mthca_next_seg); 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_ci switch (qp->transport) { 94062306a36Sopenharmony_ci case MLX: 94162306a36Sopenharmony_ci max_data_size -= 2 * sizeof (struct mthca_data_seg); 94262306a36Sopenharmony_ci break; 94362306a36Sopenharmony_ci 94462306a36Sopenharmony_ci case UD: 94562306a36Sopenharmony_ci if (mthca_is_memfree(dev)) 94662306a36Sopenharmony_ci max_data_size -= sizeof (struct mthca_arbel_ud_seg); 94762306a36Sopenharmony_ci else 94862306a36Sopenharmony_ci max_data_size -= sizeof (struct mthca_tavor_ud_seg); 94962306a36Sopenharmony_ci break; 95062306a36Sopenharmony_ci 95162306a36Sopenharmony_ci default: 95262306a36Sopenharmony_ci max_data_size -= sizeof (struct mthca_raddr_seg); 95362306a36Sopenharmony_ci break; 95462306a36Sopenharmony_ci } 95562306a36Sopenharmony_ci 95662306a36Sopenharmony_ci return max_data_size; 95762306a36Sopenharmony_ci} 95862306a36Sopenharmony_ci 95962306a36Sopenharmony_cistatic inline int mthca_max_inline_data(struct mthca_pd *pd, int max_data_size) 96062306a36Sopenharmony_ci{ 96162306a36Sopenharmony_ci /* We don't support inline data for kernel QPs (yet). */ 96262306a36Sopenharmony_ci return pd->ibpd.uobject ? max_data_size - MTHCA_INLINE_HEADER_SIZE : 0; 96362306a36Sopenharmony_ci} 96462306a36Sopenharmony_ci 96562306a36Sopenharmony_cistatic void mthca_adjust_qp_caps(struct mthca_dev *dev, 96662306a36Sopenharmony_ci struct mthca_pd *pd, 96762306a36Sopenharmony_ci struct mthca_qp *qp) 96862306a36Sopenharmony_ci{ 96962306a36Sopenharmony_ci int max_data_size = mthca_max_data_size(dev, qp, 97062306a36Sopenharmony_ci min(dev->limits.max_desc_sz, 97162306a36Sopenharmony_ci 1 << qp->sq.wqe_shift)); 97262306a36Sopenharmony_ci 97362306a36Sopenharmony_ci qp->max_inline_data = mthca_max_inline_data(pd, max_data_size); 97462306a36Sopenharmony_ci 97562306a36Sopenharmony_ci qp->sq.max_gs = min_t(int, dev->limits.max_sg, 97662306a36Sopenharmony_ci max_data_size / sizeof (struct mthca_data_seg)); 97762306a36Sopenharmony_ci qp->rq.max_gs = min_t(int, dev->limits.max_sg, 97862306a36Sopenharmony_ci (min(dev->limits.max_desc_sz, 1 << qp->rq.wqe_shift) - 97962306a36Sopenharmony_ci sizeof (struct mthca_next_seg)) / 98062306a36Sopenharmony_ci sizeof (struct mthca_data_seg)); 98162306a36Sopenharmony_ci} 98262306a36Sopenharmony_ci 98362306a36Sopenharmony_ci/* 98462306a36Sopenharmony_ci * Allocate and register buffer for WQEs. qp->rq.max, sq.max, 98562306a36Sopenharmony_ci * rq.max_gs and sq.max_gs must all be assigned. 98662306a36Sopenharmony_ci * mthca_alloc_wqe_buf will calculate rq.wqe_shift and 98762306a36Sopenharmony_ci * sq.wqe_shift (as well as send_wqe_offset, is_direct, and 98862306a36Sopenharmony_ci * queue) 98962306a36Sopenharmony_ci */ 99062306a36Sopenharmony_cistatic int mthca_alloc_wqe_buf(struct mthca_dev *dev, 99162306a36Sopenharmony_ci struct mthca_pd *pd, 99262306a36Sopenharmony_ci struct mthca_qp *qp, 99362306a36Sopenharmony_ci struct ib_udata *udata) 99462306a36Sopenharmony_ci{ 99562306a36Sopenharmony_ci int size; 99662306a36Sopenharmony_ci int err = -ENOMEM; 99762306a36Sopenharmony_ci 99862306a36Sopenharmony_ci size = sizeof (struct mthca_next_seg) + 99962306a36Sopenharmony_ci qp->rq.max_gs * sizeof (struct mthca_data_seg); 100062306a36Sopenharmony_ci 100162306a36Sopenharmony_ci if (size > dev->limits.max_desc_sz) 100262306a36Sopenharmony_ci return -EINVAL; 100362306a36Sopenharmony_ci 100462306a36Sopenharmony_ci for (qp->rq.wqe_shift = 6; 1 << qp->rq.wqe_shift < size; 100562306a36Sopenharmony_ci qp->rq.wqe_shift++) 100662306a36Sopenharmony_ci ; /* nothing */ 100762306a36Sopenharmony_ci 100862306a36Sopenharmony_ci size = qp->sq.max_gs * sizeof (struct mthca_data_seg); 100962306a36Sopenharmony_ci switch (qp->transport) { 101062306a36Sopenharmony_ci case MLX: 101162306a36Sopenharmony_ci size += 2 * sizeof (struct mthca_data_seg); 101262306a36Sopenharmony_ci break; 101362306a36Sopenharmony_ci 101462306a36Sopenharmony_ci case UD: 101562306a36Sopenharmony_ci size += mthca_is_memfree(dev) ? 101662306a36Sopenharmony_ci sizeof (struct mthca_arbel_ud_seg) : 101762306a36Sopenharmony_ci sizeof (struct mthca_tavor_ud_seg); 101862306a36Sopenharmony_ci break; 101962306a36Sopenharmony_ci 102062306a36Sopenharmony_ci case UC: 102162306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg); 102262306a36Sopenharmony_ci break; 102362306a36Sopenharmony_ci 102462306a36Sopenharmony_ci case RC: 102562306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg); 102662306a36Sopenharmony_ci /* 102762306a36Sopenharmony_ci * An atomic op will require an atomic segment, a 102862306a36Sopenharmony_ci * remote address segment and one scatter entry. 102962306a36Sopenharmony_ci */ 103062306a36Sopenharmony_ci size = max_t(int, size, 103162306a36Sopenharmony_ci sizeof (struct mthca_atomic_seg) + 103262306a36Sopenharmony_ci sizeof (struct mthca_raddr_seg) + 103362306a36Sopenharmony_ci sizeof (struct mthca_data_seg)); 103462306a36Sopenharmony_ci break; 103562306a36Sopenharmony_ci 103662306a36Sopenharmony_ci default: 103762306a36Sopenharmony_ci break; 103862306a36Sopenharmony_ci } 103962306a36Sopenharmony_ci 104062306a36Sopenharmony_ci /* Make sure that we have enough space for a bind request */ 104162306a36Sopenharmony_ci size = max_t(int, size, sizeof (struct mthca_bind_seg)); 104262306a36Sopenharmony_ci 104362306a36Sopenharmony_ci size += sizeof (struct mthca_next_seg); 104462306a36Sopenharmony_ci 104562306a36Sopenharmony_ci if (size > dev->limits.max_desc_sz) 104662306a36Sopenharmony_ci return -EINVAL; 104762306a36Sopenharmony_ci 104862306a36Sopenharmony_ci for (qp->sq.wqe_shift = 6; 1 << qp->sq.wqe_shift < size; 104962306a36Sopenharmony_ci qp->sq.wqe_shift++) 105062306a36Sopenharmony_ci ; /* nothing */ 105162306a36Sopenharmony_ci 105262306a36Sopenharmony_ci qp->send_wqe_offset = ALIGN(qp->rq.max << qp->rq.wqe_shift, 105362306a36Sopenharmony_ci 1 << qp->sq.wqe_shift); 105462306a36Sopenharmony_ci 105562306a36Sopenharmony_ci /* 105662306a36Sopenharmony_ci * If this is a userspace QP, we don't actually have to 105762306a36Sopenharmony_ci * allocate anything. All we need is to calculate the WQE 105862306a36Sopenharmony_ci * sizes and the send_wqe_offset, so we're done now. 105962306a36Sopenharmony_ci */ 106062306a36Sopenharmony_ci if (udata) 106162306a36Sopenharmony_ci return 0; 106262306a36Sopenharmony_ci 106362306a36Sopenharmony_ci size = PAGE_ALIGN(qp->send_wqe_offset + 106462306a36Sopenharmony_ci (qp->sq.max << qp->sq.wqe_shift)); 106562306a36Sopenharmony_ci 106662306a36Sopenharmony_ci qp->wrid = kmalloc_array(qp->rq.max + qp->sq.max, sizeof(u64), 106762306a36Sopenharmony_ci GFP_KERNEL); 106862306a36Sopenharmony_ci if (!qp->wrid) 106962306a36Sopenharmony_ci goto err_out; 107062306a36Sopenharmony_ci 107162306a36Sopenharmony_ci err = mthca_buf_alloc(dev, size, MTHCA_MAX_DIRECT_QP_SIZE, 107262306a36Sopenharmony_ci &qp->queue, &qp->is_direct, pd, 0, &qp->mr); 107362306a36Sopenharmony_ci if (err) 107462306a36Sopenharmony_ci goto err_out; 107562306a36Sopenharmony_ci 107662306a36Sopenharmony_ci return 0; 107762306a36Sopenharmony_ci 107862306a36Sopenharmony_cierr_out: 107962306a36Sopenharmony_ci kfree(qp->wrid); 108062306a36Sopenharmony_ci return err; 108162306a36Sopenharmony_ci} 108262306a36Sopenharmony_ci 108362306a36Sopenharmony_cistatic void mthca_free_wqe_buf(struct mthca_dev *dev, 108462306a36Sopenharmony_ci struct mthca_qp *qp) 108562306a36Sopenharmony_ci{ 108662306a36Sopenharmony_ci mthca_buf_free(dev, PAGE_ALIGN(qp->send_wqe_offset + 108762306a36Sopenharmony_ci (qp->sq.max << qp->sq.wqe_shift)), 108862306a36Sopenharmony_ci &qp->queue, qp->is_direct, &qp->mr); 108962306a36Sopenharmony_ci kfree(qp->wrid); 109062306a36Sopenharmony_ci} 109162306a36Sopenharmony_ci 109262306a36Sopenharmony_cistatic int mthca_map_memfree(struct mthca_dev *dev, 109362306a36Sopenharmony_ci struct mthca_qp *qp) 109462306a36Sopenharmony_ci{ 109562306a36Sopenharmony_ci int ret; 109662306a36Sopenharmony_ci 109762306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 109862306a36Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.qp_table, qp->qpn); 109962306a36Sopenharmony_ci if (ret) 110062306a36Sopenharmony_ci return ret; 110162306a36Sopenharmony_ci 110262306a36Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.eqp_table, qp->qpn); 110362306a36Sopenharmony_ci if (ret) 110462306a36Sopenharmony_ci goto err_qpc; 110562306a36Sopenharmony_ci 110662306a36Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.rdb_table, 110762306a36Sopenharmony_ci qp->qpn << dev->qp_table.rdb_shift); 110862306a36Sopenharmony_ci if (ret) 110962306a36Sopenharmony_ci goto err_eqpc; 111062306a36Sopenharmony_ci 111162306a36Sopenharmony_ci } 111262306a36Sopenharmony_ci 111362306a36Sopenharmony_ci return 0; 111462306a36Sopenharmony_ci 111562306a36Sopenharmony_cierr_eqpc: 111662306a36Sopenharmony_ci mthca_table_put(dev, dev->qp_table.eqp_table, qp->qpn); 111762306a36Sopenharmony_ci 111862306a36Sopenharmony_cierr_qpc: 111962306a36Sopenharmony_ci mthca_table_put(dev, dev->qp_table.qp_table, qp->qpn); 112062306a36Sopenharmony_ci 112162306a36Sopenharmony_ci return ret; 112262306a36Sopenharmony_ci} 112362306a36Sopenharmony_ci 112462306a36Sopenharmony_cistatic void mthca_unmap_memfree(struct mthca_dev *dev, 112562306a36Sopenharmony_ci struct mthca_qp *qp) 112662306a36Sopenharmony_ci{ 112762306a36Sopenharmony_ci mthca_table_put(dev, dev->qp_table.rdb_table, 112862306a36Sopenharmony_ci qp->qpn << dev->qp_table.rdb_shift); 112962306a36Sopenharmony_ci mthca_table_put(dev, dev->qp_table.eqp_table, qp->qpn); 113062306a36Sopenharmony_ci mthca_table_put(dev, dev->qp_table.qp_table, qp->qpn); 113162306a36Sopenharmony_ci} 113262306a36Sopenharmony_ci 113362306a36Sopenharmony_cistatic int mthca_alloc_memfree(struct mthca_dev *dev, 113462306a36Sopenharmony_ci struct mthca_qp *qp) 113562306a36Sopenharmony_ci{ 113662306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 113762306a36Sopenharmony_ci qp->rq.db_index = mthca_alloc_db(dev, MTHCA_DB_TYPE_RQ, 113862306a36Sopenharmony_ci qp->qpn, &qp->rq.db); 113962306a36Sopenharmony_ci if (qp->rq.db_index < 0) 114062306a36Sopenharmony_ci return -ENOMEM; 114162306a36Sopenharmony_ci 114262306a36Sopenharmony_ci qp->sq.db_index = mthca_alloc_db(dev, MTHCA_DB_TYPE_SQ, 114362306a36Sopenharmony_ci qp->qpn, &qp->sq.db); 114462306a36Sopenharmony_ci if (qp->sq.db_index < 0) { 114562306a36Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_RQ, qp->rq.db_index); 114662306a36Sopenharmony_ci return -ENOMEM; 114762306a36Sopenharmony_ci } 114862306a36Sopenharmony_ci } 114962306a36Sopenharmony_ci 115062306a36Sopenharmony_ci return 0; 115162306a36Sopenharmony_ci} 115262306a36Sopenharmony_ci 115362306a36Sopenharmony_cistatic void mthca_free_memfree(struct mthca_dev *dev, 115462306a36Sopenharmony_ci struct mthca_qp *qp) 115562306a36Sopenharmony_ci{ 115662306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 115762306a36Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_SQ, qp->sq.db_index); 115862306a36Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_RQ, qp->rq.db_index); 115962306a36Sopenharmony_ci } 116062306a36Sopenharmony_ci} 116162306a36Sopenharmony_ci 116262306a36Sopenharmony_cistatic int mthca_alloc_qp_common(struct mthca_dev *dev, 116362306a36Sopenharmony_ci struct mthca_pd *pd, 116462306a36Sopenharmony_ci struct mthca_cq *send_cq, 116562306a36Sopenharmony_ci struct mthca_cq *recv_cq, 116662306a36Sopenharmony_ci enum ib_sig_type send_policy, 116762306a36Sopenharmony_ci struct mthca_qp *qp, 116862306a36Sopenharmony_ci struct ib_udata *udata) 116962306a36Sopenharmony_ci{ 117062306a36Sopenharmony_ci int ret; 117162306a36Sopenharmony_ci int i; 117262306a36Sopenharmony_ci struct mthca_next_seg *next; 117362306a36Sopenharmony_ci 117462306a36Sopenharmony_ci qp->refcount = 1; 117562306a36Sopenharmony_ci init_waitqueue_head(&qp->wait); 117662306a36Sopenharmony_ci mutex_init(&qp->mutex); 117762306a36Sopenharmony_ci qp->state = IB_QPS_RESET; 117862306a36Sopenharmony_ci qp->atomic_rd_en = 0; 117962306a36Sopenharmony_ci qp->resp_depth = 0; 118062306a36Sopenharmony_ci qp->sq_policy = send_policy; 118162306a36Sopenharmony_ci mthca_wq_reset(&qp->sq); 118262306a36Sopenharmony_ci mthca_wq_reset(&qp->rq); 118362306a36Sopenharmony_ci 118462306a36Sopenharmony_ci spin_lock_init(&qp->sq.lock); 118562306a36Sopenharmony_ci spin_lock_init(&qp->rq.lock); 118662306a36Sopenharmony_ci 118762306a36Sopenharmony_ci ret = mthca_map_memfree(dev, qp); 118862306a36Sopenharmony_ci if (ret) 118962306a36Sopenharmony_ci return ret; 119062306a36Sopenharmony_ci 119162306a36Sopenharmony_ci ret = mthca_alloc_wqe_buf(dev, pd, qp, udata); 119262306a36Sopenharmony_ci if (ret) { 119362306a36Sopenharmony_ci mthca_unmap_memfree(dev, qp); 119462306a36Sopenharmony_ci return ret; 119562306a36Sopenharmony_ci } 119662306a36Sopenharmony_ci 119762306a36Sopenharmony_ci mthca_adjust_qp_caps(dev, pd, qp); 119862306a36Sopenharmony_ci 119962306a36Sopenharmony_ci /* 120062306a36Sopenharmony_ci * If this is a userspace QP, we're done now. The doorbells 120162306a36Sopenharmony_ci * will be allocated and buffers will be initialized in 120262306a36Sopenharmony_ci * userspace. 120362306a36Sopenharmony_ci */ 120462306a36Sopenharmony_ci if (udata) 120562306a36Sopenharmony_ci return 0; 120662306a36Sopenharmony_ci 120762306a36Sopenharmony_ci ret = mthca_alloc_memfree(dev, qp); 120862306a36Sopenharmony_ci if (ret) { 120962306a36Sopenharmony_ci mthca_free_wqe_buf(dev, qp); 121062306a36Sopenharmony_ci mthca_unmap_memfree(dev, qp); 121162306a36Sopenharmony_ci return ret; 121262306a36Sopenharmony_ci } 121362306a36Sopenharmony_ci 121462306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 121562306a36Sopenharmony_ci struct mthca_data_seg *scatter; 121662306a36Sopenharmony_ci int size = (sizeof (struct mthca_next_seg) + 121762306a36Sopenharmony_ci qp->rq.max_gs * sizeof (struct mthca_data_seg)) / 16; 121862306a36Sopenharmony_ci 121962306a36Sopenharmony_ci for (i = 0; i < qp->rq.max; ++i) { 122062306a36Sopenharmony_ci next = get_recv_wqe(qp, i); 122162306a36Sopenharmony_ci next->nda_op = cpu_to_be32(((i + 1) & (qp->rq.max - 1)) << 122262306a36Sopenharmony_ci qp->rq.wqe_shift); 122362306a36Sopenharmony_ci next->ee_nds = cpu_to_be32(size); 122462306a36Sopenharmony_ci 122562306a36Sopenharmony_ci for (scatter = (void *) (next + 1); 122662306a36Sopenharmony_ci (void *) scatter < (void *) next + (1 << qp->rq.wqe_shift); 122762306a36Sopenharmony_ci ++scatter) 122862306a36Sopenharmony_ci scatter->lkey = cpu_to_be32(MTHCA_INVAL_LKEY); 122962306a36Sopenharmony_ci } 123062306a36Sopenharmony_ci 123162306a36Sopenharmony_ci for (i = 0; i < qp->sq.max; ++i) { 123262306a36Sopenharmony_ci next = get_send_wqe(qp, i); 123362306a36Sopenharmony_ci next->nda_op = cpu_to_be32((((i + 1) & (qp->sq.max - 1)) << 123462306a36Sopenharmony_ci qp->sq.wqe_shift) + 123562306a36Sopenharmony_ci qp->send_wqe_offset); 123662306a36Sopenharmony_ci } 123762306a36Sopenharmony_ci } else { 123862306a36Sopenharmony_ci for (i = 0; i < qp->rq.max; ++i) { 123962306a36Sopenharmony_ci next = get_recv_wqe(qp, i); 124062306a36Sopenharmony_ci next->nda_op = htonl((((i + 1) % qp->rq.max) << 124162306a36Sopenharmony_ci qp->rq.wqe_shift) | 1); 124262306a36Sopenharmony_ci } 124362306a36Sopenharmony_ci 124462306a36Sopenharmony_ci } 124562306a36Sopenharmony_ci 124662306a36Sopenharmony_ci qp->sq.last = get_send_wqe(qp, qp->sq.max - 1); 124762306a36Sopenharmony_ci qp->rq.last = get_recv_wqe(qp, qp->rq.max - 1); 124862306a36Sopenharmony_ci 124962306a36Sopenharmony_ci return 0; 125062306a36Sopenharmony_ci} 125162306a36Sopenharmony_ci 125262306a36Sopenharmony_cistatic int mthca_set_qp_size(struct mthca_dev *dev, struct ib_qp_cap *cap, 125362306a36Sopenharmony_ci struct mthca_pd *pd, struct mthca_qp *qp) 125462306a36Sopenharmony_ci{ 125562306a36Sopenharmony_ci int max_data_size = mthca_max_data_size(dev, qp, dev->limits.max_desc_sz); 125662306a36Sopenharmony_ci 125762306a36Sopenharmony_ci /* Sanity check QP size before proceeding */ 125862306a36Sopenharmony_ci if (cap->max_send_wr > dev->limits.max_wqes || 125962306a36Sopenharmony_ci cap->max_recv_wr > dev->limits.max_wqes || 126062306a36Sopenharmony_ci cap->max_send_sge > dev->limits.max_sg || 126162306a36Sopenharmony_ci cap->max_recv_sge > dev->limits.max_sg || 126262306a36Sopenharmony_ci cap->max_inline_data > mthca_max_inline_data(pd, max_data_size)) 126362306a36Sopenharmony_ci return -EINVAL; 126462306a36Sopenharmony_ci 126562306a36Sopenharmony_ci /* 126662306a36Sopenharmony_ci * For MLX transport we need 2 extra send gather entries: 126762306a36Sopenharmony_ci * one for the header and one for the checksum at the end 126862306a36Sopenharmony_ci */ 126962306a36Sopenharmony_ci if (qp->transport == MLX && cap->max_send_sge + 2 > dev->limits.max_sg) 127062306a36Sopenharmony_ci return -EINVAL; 127162306a36Sopenharmony_ci 127262306a36Sopenharmony_ci if (mthca_is_memfree(dev)) { 127362306a36Sopenharmony_ci qp->rq.max = cap->max_recv_wr ? 127462306a36Sopenharmony_ci roundup_pow_of_two(cap->max_recv_wr) : 0; 127562306a36Sopenharmony_ci qp->sq.max = cap->max_send_wr ? 127662306a36Sopenharmony_ci roundup_pow_of_two(cap->max_send_wr) : 0; 127762306a36Sopenharmony_ci } else { 127862306a36Sopenharmony_ci qp->rq.max = cap->max_recv_wr; 127962306a36Sopenharmony_ci qp->sq.max = cap->max_send_wr; 128062306a36Sopenharmony_ci } 128162306a36Sopenharmony_ci 128262306a36Sopenharmony_ci qp->rq.max_gs = cap->max_recv_sge; 128362306a36Sopenharmony_ci qp->sq.max_gs = max_t(int, cap->max_send_sge, 128462306a36Sopenharmony_ci ALIGN(cap->max_inline_data + MTHCA_INLINE_HEADER_SIZE, 128562306a36Sopenharmony_ci MTHCA_INLINE_CHUNK_SIZE) / 128662306a36Sopenharmony_ci sizeof (struct mthca_data_seg)); 128762306a36Sopenharmony_ci 128862306a36Sopenharmony_ci return 0; 128962306a36Sopenharmony_ci} 129062306a36Sopenharmony_ci 129162306a36Sopenharmony_ciint mthca_alloc_qp(struct mthca_dev *dev, 129262306a36Sopenharmony_ci struct mthca_pd *pd, 129362306a36Sopenharmony_ci struct mthca_cq *send_cq, 129462306a36Sopenharmony_ci struct mthca_cq *recv_cq, 129562306a36Sopenharmony_ci enum ib_qp_type type, 129662306a36Sopenharmony_ci enum ib_sig_type send_policy, 129762306a36Sopenharmony_ci struct ib_qp_cap *cap, 129862306a36Sopenharmony_ci struct mthca_qp *qp, 129962306a36Sopenharmony_ci struct ib_udata *udata) 130062306a36Sopenharmony_ci{ 130162306a36Sopenharmony_ci int err; 130262306a36Sopenharmony_ci 130362306a36Sopenharmony_ci switch (type) { 130462306a36Sopenharmony_ci case IB_QPT_RC: qp->transport = RC; break; 130562306a36Sopenharmony_ci case IB_QPT_UC: qp->transport = UC; break; 130662306a36Sopenharmony_ci case IB_QPT_UD: qp->transport = UD; break; 130762306a36Sopenharmony_ci default: return -EINVAL; 130862306a36Sopenharmony_ci } 130962306a36Sopenharmony_ci 131062306a36Sopenharmony_ci err = mthca_set_qp_size(dev, cap, pd, qp); 131162306a36Sopenharmony_ci if (err) 131262306a36Sopenharmony_ci return err; 131362306a36Sopenharmony_ci 131462306a36Sopenharmony_ci qp->qpn = mthca_alloc(&dev->qp_table.alloc); 131562306a36Sopenharmony_ci if (qp->qpn == -1) 131662306a36Sopenharmony_ci return -ENOMEM; 131762306a36Sopenharmony_ci 131862306a36Sopenharmony_ci /* initialize port to zero for error-catching. */ 131962306a36Sopenharmony_ci qp->port = 0; 132062306a36Sopenharmony_ci 132162306a36Sopenharmony_ci err = mthca_alloc_qp_common(dev, pd, send_cq, recv_cq, 132262306a36Sopenharmony_ci send_policy, qp, udata); 132362306a36Sopenharmony_ci if (err) { 132462306a36Sopenharmony_ci mthca_free(&dev->qp_table.alloc, qp->qpn); 132562306a36Sopenharmony_ci return err; 132662306a36Sopenharmony_ci } 132762306a36Sopenharmony_ci 132862306a36Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 132962306a36Sopenharmony_ci mthca_array_set(&dev->qp_table.qp, 133062306a36Sopenharmony_ci qp->qpn & (dev->limits.num_qps - 1), qp); 133162306a36Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 133262306a36Sopenharmony_ci 133362306a36Sopenharmony_ci return 0; 133462306a36Sopenharmony_ci} 133562306a36Sopenharmony_ci 133662306a36Sopenharmony_cistatic void mthca_lock_cqs(struct mthca_cq *send_cq, struct mthca_cq *recv_cq) 133762306a36Sopenharmony_ci __acquires(&send_cq->lock) __acquires(&recv_cq->lock) 133862306a36Sopenharmony_ci{ 133962306a36Sopenharmony_ci if (send_cq == recv_cq) { 134062306a36Sopenharmony_ci spin_lock_irq(&send_cq->lock); 134162306a36Sopenharmony_ci __acquire(&recv_cq->lock); 134262306a36Sopenharmony_ci } else if (send_cq->cqn < recv_cq->cqn) { 134362306a36Sopenharmony_ci spin_lock_irq(&send_cq->lock); 134462306a36Sopenharmony_ci spin_lock_nested(&recv_cq->lock, SINGLE_DEPTH_NESTING); 134562306a36Sopenharmony_ci } else { 134662306a36Sopenharmony_ci spin_lock_irq(&recv_cq->lock); 134762306a36Sopenharmony_ci spin_lock_nested(&send_cq->lock, SINGLE_DEPTH_NESTING); 134862306a36Sopenharmony_ci } 134962306a36Sopenharmony_ci} 135062306a36Sopenharmony_ci 135162306a36Sopenharmony_cistatic void mthca_unlock_cqs(struct mthca_cq *send_cq, struct mthca_cq *recv_cq) 135262306a36Sopenharmony_ci __releases(&send_cq->lock) __releases(&recv_cq->lock) 135362306a36Sopenharmony_ci{ 135462306a36Sopenharmony_ci if (send_cq == recv_cq) { 135562306a36Sopenharmony_ci __release(&recv_cq->lock); 135662306a36Sopenharmony_ci spin_unlock_irq(&send_cq->lock); 135762306a36Sopenharmony_ci } else if (send_cq->cqn < recv_cq->cqn) { 135862306a36Sopenharmony_ci spin_unlock(&recv_cq->lock); 135962306a36Sopenharmony_ci spin_unlock_irq(&send_cq->lock); 136062306a36Sopenharmony_ci } else { 136162306a36Sopenharmony_ci spin_unlock(&send_cq->lock); 136262306a36Sopenharmony_ci spin_unlock_irq(&recv_cq->lock); 136362306a36Sopenharmony_ci } 136462306a36Sopenharmony_ci} 136562306a36Sopenharmony_ci 136662306a36Sopenharmony_ciint mthca_alloc_sqp(struct mthca_dev *dev, 136762306a36Sopenharmony_ci struct mthca_pd *pd, 136862306a36Sopenharmony_ci struct mthca_cq *send_cq, 136962306a36Sopenharmony_ci struct mthca_cq *recv_cq, 137062306a36Sopenharmony_ci enum ib_sig_type send_policy, 137162306a36Sopenharmony_ci struct ib_qp_cap *cap, 137262306a36Sopenharmony_ci int qpn, 137362306a36Sopenharmony_ci u32 port, 137462306a36Sopenharmony_ci struct mthca_qp *qp, 137562306a36Sopenharmony_ci struct ib_udata *udata) 137662306a36Sopenharmony_ci{ 137762306a36Sopenharmony_ci u32 mqpn = qpn * 2 + dev->qp_table.sqp_start + port - 1; 137862306a36Sopenharmony_ci int err; 137962306a36Sopenharmony_ci 138062306a36Sopenharmony_ci qp->transport = MLX; 138162306a36Sopenharmony_ci err = mthca_set_qp_size(dev, cap, pd, qp); 138262306a36Sopenharmony_ci if (err) 138362306a36Sopenharmony_ci return err; 138462306a36Sopenharmony_ci 138562306a36Sopenharmony_ci qp->sqp->header_buf_size = qp->sq.max * MTHCA_UD_HEADER_SIZE; 138662306a36Sopenharmony_ci qp->sqp->header_buf = 138762306a36Sopenharmony_ci dma_alloc_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 138862306a36Sopenharmony_ci &qp->sqp->header_dma, GFP_KERNEL); 138962306a36Sopenharmony_ci if (!qp->sqp->header_buf) 139062306a36Sopenharmony_ci return -ENOMEM; 139162306a36Sopenharmony_ci 139262306a36Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 139362306a36Sopenharmony_ci if (mthca_array_get(&dev->qp_table.qp, mqpn)) 139462306a36Sopenharmony_ci err = -EBUSY; 139562306a36Sopenharmony_ci else 139662306a36Sopenharmony_ci mthca_array_set(&dev->qp_table.qp, mqpn, qp); 139762306a36Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 139862306a36Sopenharmony_ci 139962306a36Sopenharmony_ci if (err) 140062306a36Sopenharmony_ci goto err_out; 140162306a36Sopenharmony_ci 140262306a36Sopenharmony_ci qp->port = port; 140362306a36Sopenharmony_ci qp->qpn = mqpn; 140462306a36Sopenharmony_ci qp->transport = MLX; 140562306a36Sopenharmony_ci 140662306a36Sopenharmony_ci err = mthca_alloc_qp_common(dev, pd, send_cq, recv_cq, 140762306a36Sopenharmony_ci send_policy, qp, udata); 140862306a36Sopenharmony_ci if (err) 140962306a36Sopenharmony_ci goto err_out_free; 141062306a36Sopenharmony_ci 141162306a36Sopenharmony_ci atomic_inc(&pd->sqp_count); 141262306a36Sopenharmony_ci 141362306a36Sopenharmony_ci return 0; 141462306a36Sopenharmony_ci 141562306a36Sopenharmony_ci err_out_free: 141662306a36Sopenharmony_ci /* 141762306a36Sopenharmony_ci * Lock CQs here, so that CQ polling code can do QP lookup 141862306a36Sopenharmony_ci * without taking a lock. 141962306a36Sopenharmony_ci */ 142062306a36Sopenharmony_ci mthca_lock_cqs(send_cq, recv_cq); 142162306a36Sopenharmony_ci 142262306a36Sopenharmony_ci spin_lock(&dev->qp_table.lock); 142362306a36Sopenharmony_ci mthca_array_clear(&dev->qp_table.qp, mqpn); 142462306a36Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 142562306a36Sopenharmony_ci 142662306a36Sopenharmony_ci mthca_unlock_cqs(send_cq, recv_cq); 142762306a36Sopenharmony_ci 142862306a36Sopenharmony_cierr_out: 142962306a36Sopenharmony_ci dma_free_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 143062306a36Sopenharmony_ci qp->sqp->header_buf, qp->sqp->header_dma); 143162306a36Sopenharmony_ci return err; 143262306a36Sopenharmony_ci} 143362306a36Sopenharmony_ci 143462306a36Sopenharmony_cistatic inline int get_qp_refcount(struct mthca_dev *dev, struct mthca_qp *qp) 143562306a36Sopenharmony_ci{ 143662306a36Sopenharmony_ci int c; 143762306a36Sopenharmony_ci 143862306a36Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 143962306a36Sopenharmony_ci c = qp->refcount; 144062306a36Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 144162306a36Sopenharmony_ci 144262306a36Sopenharmony_ci return c; 144362306a36Sopenharmony_ci} 144462306a36Sopenharmony_ci 144562306a36Sopenharmony_civoid mthca_free_qp(struct mthca_dev *dev, 144662306a36Sopenharmony_ci struct mthca_qp *qp) 144762306a36Sopenharmony_ci{ 144862306a36Sopenharmony_ci struct mthca_cq *send_cq; 144962306a36Sopenharmony_ci struct mthca_cq *recv_cq; 145062306a36Sopenharmony_ci 145162306a36Sopenharmony_ci send_cq = to_mcq(qp->ibqp.send_cq); 145262306a36Sopenharmony_ci recv_cq = to_mcq(qp->ibqp.recv_cq); 145362306a36Sopenharmony_ci 145462306a36Sopenharmony_ci /* 145562306a36Sopenharmony_ci * Lock CQs here, so that CQ polling code can do QP lookup 145662306a36Sopenharmony_ci * without taking a lock. 145762306a36Sopenharmony_ci */ 145862306a36Sopenharmony_ci mthca_lock_cqs(send_cq, recv_cq); 145962306a36Sopenharmony_ci 146062306a36Sopenharmony_ci spin_lock(&dev->qp_table.lock); 146162306a36Sopenharmony_ci mthca_array_clear(&dev->qp_table.qp, 146262306a36Sopenharmony_ci qp->qpn & (dev->limits.num_qps - 1)); 146362306a36Sopenharmony_ci --qp->refcount; 146462306a36Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 146562306a36Sopenharmony_ci 146662306a36Sopenharmony_ci mthca_unlock_cqs(send_cq, recv_cq); 146762306a36Sopenharmony_ci 146862306a36Sopenharmony_ci wait_event(qp->wait, !get_qp_refcount(dev, qp)); 146962306a36Sopenharmony_ci 147062306a36Sopenharmony_ci if (qp->state != IB_QPS_RESET) 147162306a36Sopenharmony_ci mthca_MODIFY_QP(dev, qp->state, IB_QPS_RESET, qp->qpn, 0, 147262306a36Sopenharmony_ci NULL, 0); 147362306a36Sopenharmony_ci 147462306a36Sopenharmony_ci /* 147562306a36Sopenharmony_ci * If this is a userspace QP, the buffers, MR, CQs and so on 147662306a36Sopenharmony_ci * will be cleaned up in userspace, so all we have to do is 147762306a36Sopenharmony_ci * unref the mem-free tables and free the QPN in our table. 147862306a36Sopenharmony_ci */ 147962306a36Sopenharmony_ci if (!qp->ibqp.uobject) { 148062306a36Sopenharmony_ci mthca_cq_clean(dev, recv_cq, qp->qpn, 148162306a36Sopenharmony_ci qp->ibqp.srq ? to_msrq(qp->ibqp.srq) : NULL); 148262306a36Sopenharmony_ci if (send_cq != recv_cq) 148362306a36Sopenharmony_ci mthca_cq_clean(dev, send_cq, qp->qpn, NULL); 148462306a36Sopenharmony_ci 148562306a36Sopenharmony_ci mthca_free_memfree(dev, qp); 148662306a36Sopenharmony_ci mthca_free_wqe_buf(dev, qp); 148762306a36Sopenharmony_ci } 148862306a36Sopenharmony_ci 148962306a36Sopenharmony_ci mthca_unmap_memfree(dev, qp); 149062306a36Sopenharmony_ci 149162306a36Sopenharmony_ci if (is_sqp(dev, qp)) { 149262306a36Sopenharmony_ci atomic_dec(&(to_mpd(qp->ibqp.pd)->sqp_count)); 149362306a36Sopenharmony_ci dma_free_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 149462306a36Sopenharmony_ci qp->sqp->header_buf, qp->sqp->header_dma); 149562306a36Sopenharmony_ci } else 149662306a36Sopenharmony_ci mthca_free(&dev->qp_table.alloc, qp->qpn); 149762306a36Sopenharmony_ci} 149862306a36Sopenharmony_ci 149962306a36Sopenharmony_ci/* Create UD header for an MLX send and build a data segment for it */ 150062306a36Sopenharmony_cistatic int build_mlx_header(struct mthca_dev *dev, struct mthca_qp *qp, int ind, 150162306a36Sopenharmony_ci const struct ib_ud_wr *wr, 150262306a36Sopenharmony_ci struct mthca_mlx_seg *mlx, 150362306a36Sopenharmony_ci struct mthca_data_seg *data) 150462306a36Sopenharmony_ci{ 150562306a36Sopenharmony_ci struct mthca_sqp *sqp = qp->sqp; 150662306a36Sopenharmony_ci int header_size; 150762306a36Sopenharmony_ci int err; 150862306a36Sopenharmony_ci u16 pkey; 150962306a36Sopenharmony_ci 151062306a36Sopenharmony_ci ib_ud_header_init(256, /* assume a MAD */ 1, 0, 0, 151162306a36Sopenharmony_ci mthca_ah_grh_present(to_mah(wr->ah)), 0, 0, 0, 151262306a36Sopenharmony_ci &sqp->ud_header); 151362306a36Sopenharmony_ci 151462306a36Sopenharmony_ci err = mthca_read_ah(dev, to_mah(wr->ah), &sqp->ud_header); 151562306a36Sopenharmony_ci if (err) 151662306a36Sopenharmony_ci return err; 151762306a36Sopenharmony_ci mlx->flags &= ~cpu_to_be32(MTHCA_NEXT_SOLICIT | 1); 151862306a36Sopenharmony_ci mlx->flags |= cpu_to_be32((!qp->ibqp.qp_num ? MTHCA_MLX_VL15 : 0) | 151962306a36Sopenharmony_ci (sqp->ud_header.lrh.destination_lid == 152062306a36Sopenharmony_ci IB_LID_PERMISSIVE ? MTHCA_MLX_SLR : 0) | 152162306a36Sopenharmony_ci (sqp->ud_header.lrh.service_level << 8)); 152262306a36Sopenharmony_ci mlx->rlid = sqp->ud_header.lrh.destination_lid; 152362306a36Sopenharmony_ci mlx->vcrc = 0; 152462306a36Sopenharmony_ci 152562306a36Sopenharmony_ci switch (wr->wr.opcode) { 152662306a36Sopenharmony_ci case IB_WR_SEND: 152762306a36Sopenharmony_ci sqp->ud_header.bth.opcode = IB_OPCODE_UD_SEND_ONLY; 152862306a36Sopenharmony_ci sqp->ud_header.immediate_present = 0; 152962306a36Sopenharmony_ci break; 153062306a36Sopenharmony_ci case IB_WR_SEND_WITH_IMM: 153162306a36Sopenharmony_ci sqp->ud_header.bth.opcode = IB_OPCODE_UD_SEND_ONLY_WITH_IMMEDIATE; 153262306a36Sopenharmony_ci sqp->ud_header.immediate_present = 1; 153362306a36Sopenharmony_ci sqp->ud_header.immediate_data = wr->wr.ex.imm_data; 153462306a36Sopenharmony_ci break; 153562306a36Sopenharmony_ci default: 153662306a36Sopenharmony_ci return -EINVAL; 153762306a36Sopenharmony_ci } 153862306a36Sopenharmony_ci 153962306a36Sopenharmony_ci sqp->ud_header.lrh.virtual_lane = !qp->ibqp.qp_num ? 15 : 0; 154062306a36Sopenharmony_ci if (sqp->ud_header.lrh.destination_lid == IB_LID_PERMISSIVE) 154162306a36Sopenharmony_ci sqp->ud_header.lrh.source_lid = IB_LID_PERMISSIVE; 154262306a36Sopenharmony_ci sqp->ud_header.bth.solicited_event = !!(wr->wr.send_flags & IB_SEND_SOLICITED); 154362306a36Sopenharmony_ci if (!qp->ibqp.qp_num) 154462306a36Sopenharmony_ci ib_get_cached_pkey(&dev->ib_dev, qp->port, sqp->pkey_index, 154562306a36Sopenharmony_ci &pkey); 154662306a36Sopenharmony_ci else 154762306a36Sopenharmony_ci ib_get_cached_pkey(&dev->ib_dev, qp->port, wr->pkey_index, 154862306a36Sopenharmony_ci &pkey); 154962306a36Sopenharmony_ci sqp->ud_header.bth.pkey = cpu_to_be16(pkey); 155062306a36Sopenharmony_ci sqp->ud_header.bth.destination_qpn = cpu_to_be32(wr->remote_qpn); 155162306a36Sopenharmony_ci sqp->ud_header.bth.psn = cpu_to_be32((sqp->send_psn++) & ((1 << 24) - 1)); 155262306a36Sopenharmony_ci sqp->ud_header.deth.qkey = cpu_to_be32(wr->remote_qkey & 0x80000000 ? 155362306a36Sopenharmony_ci sqp->qkey : wr->remote_qkey); 155462306a36Sopenharmony_ci sqp->ud_header.deth.source_qpn = cpu_to_be32(qp->ibqp.qp_num); 155562306a36Sopenharmony_ci 155662306a36Sopenharmony_ci header_size = ib_ud_header_pack(&sqp->ud_header, 155762306a36Sopenharmony_ci sqp->header_buf + 155862306a36Sopenharmony_ci ind * MTHCA_UD_HEADER_SIZE); 155962306a36Sopenharmony_ci 156062306a36Sopenharmony_ci data->byte_count = cpu_to_be32(header_size); 156162306a36Sopenharmony_ci data->lkey = cpu_to_be32(to_mpd(qp->ibqp.pd)->ntmr.ibmr.lkey); 156262306a36Sopenharmony_ci data->addr = cpu_to_be64(sqp->header_dma + 156362306a36Sopenharmony_ci ind * MTHCA_UD_HEADER_SIZE); 156462306a36Sopenharmony_ci 156562306a36Sopenharmony_ci return 0; 156662306a36Sopenharmony_ci} 156762306a36Sopenharmony_ci 156862306a36Sopenharmony_cistatic inline int mthca_wq_overflow(struct mthca_wq *wq, int nreq, 156962306a36Sopenharmony_ci struct ib_cq *ib_cq) 157062306a36Sopenharmony_ci{ 157162306a36Sopenharmony_ci unsigned cur; 157262306a36Sopenharmony_ci struct mthca_cq *cq; 157362306a36Sopenharmony_ci 157462306a36Sopenharmony_ci cur = wq->head - wq->tail; 157562306a36Sopenharmony_ci if (likely(cur + nreq < wq->max)) 157662306a36Sopenharmony_ci return 0; 157762306a36Sopenharmony_ci 157862306a36Sopenharmony_ci cq = to_mcq(ib_cq); 157962306a36Sopenharmony_ci spin_lock(&cq->lock); 158062306a36Sopenharmony_ci cur = wq->head - wq->tail; 158162306a36Sopenharmony_ci spin_unlock(&cq->lock); 158262306a36Sopenharmony_ci 158362306a36Sopenharmony_ci return cur + nreq >= wq->max; 158462306a36Sopenharmony_ci} 158562306a36Sopenharmony_ci 158662306a36Sopenharmony_cistatic __always_inline void set_raddr_seg(struct mthca_raddr_seg *rseg, 158762306a36Sopenharmony_ci u64 remote_addr, u32 rkey) 158862306a36Sopenharmony_ci{ 158962306a36Sopenharmony_ci rseg->raddr = cpu_to_be64(remote_addr); 159062306a36Sopenharmony_ci rseg->rkey = cpu_to_be32(rkey); 159162306a36Sopenharmony_ci rseg->reserved = 0; 159262306a36Sopenharmony_ci} 159362306a36Sopenharmony_ci 159462306a36Sopenharmony_cistatic __always_inline void set_atomic_seg(struct mthca_atomic_seg *aseg, 159562306a36Sopenharmony_ci const struct ib_atomic_wr *wr) 159662306a36Sopenharmony_ci{ 159762306a36Sopenharmony_ci if (wr->wr.opcode == IB_WR_ATOMIC_CMP_AND_SWP) { 159862306a36Sopenharmony_ci aseg->swap_add = cpu_to_be64(wr->swap); 159962306a36Sopenharmony_ci aseg->compare = cpu_to_be64(wr->compare_add); 160062306a36Sopenharmony_ci } else { 160162306a36Sopenharmony_ci aseg->swap_add = cpu_to_be64(wr->compare_add); 160262306a36Sopenharmony_ci aseg->compare = 0; 160362306a36Sopenharmony_ci } 160462306a36Sopenharmony_ci 160562306a36Sopenharmony_ci} 160662306a36Sopenharmony_ci 160762306a36Sopenharmony_cistatic void set_tavor_ud_seg(struct mthca_tavor_ud_seg *useg, 160862306a36Sopenharmony_ci const struct ib_ud_wr *wr) 160962306a36Sopenharmony_ci{ 161062306a36Sopenharmony_ci useg->lkey = cpu_to_be32(to_mah(wr->ah)->key); 161162306a36Sopenharmony_ci useg->av_addr = cpu_to_be64(to_mah(wr->ah)->avdma); 161262306a36Sopenharmony_ci useg->dqpn = cpu_to_be32(wr->remote_qpn); 161362306a36Sopenharmony_ci useg->qkey = cpu_to_be32(wr->remote_qkey); 161462306a36Sopenharmony_ci 161562306a36Sopenharmony_ci} 161662306a36Sopenharmony_ci 161762306a36Sopenharmony_cistatic void set_arbel_ud_seg(struct mthca_arbel_ud_seg *useg, 161862306a36Sopenharmony_ci const struct ib_ud_wr *wr) 161962306a36Sopenharmony_ci{ 162062306a36Sopenharmony_ci memcpy(useg->av, to_mah(wr->ah)->av, MTHCA_AV_SIZE); 162162306a36Sopenharmony_ci useg->dqpn = cpu_to_be32(wr->remote_qpn); 162262306a36Sopenharmony_ci useg->qkey = cpu_to_be32(wr->remote_qkey); 162362306a36Sopenharmony_ci} 162462306a36Sopenharmony_ci 162562306a36Sopenharmony_ciint mthca_tavor_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr, 162662306a36Sopenharmony_ci const struct ib_send_wr **bad_wr) 162762306a36Sopenharmony_ci{ 162862306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 162962306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 163062306a36Sopenharmony_ci void *wqe; 163162306a36Sopenharmony_ci void *prev_wqe; 163262306a36Sopenharmony_ci unsigned long flags; 163362306a36Sopenharmony_ci int err = 0; 163462306a36Sopenharmony_ci int nreq; 163562306a36Sopenharmony_ci int i; 163662306a36Sopenharmony_ci int size; 163762306a36Sopenharmony_ci /* 163862306a36Sopenharmony_ci * f0 and size0 are only used if nreq != 0, and they will 163962306a36Sopenharmony_ci * always be initialized the first time through the main loop 164062306a36Sopenharmony_ci * before nreq is incremented. So nreq cannot become non-zero 164162306a36Sopenharmony_ci * without initializing f0 and size0, and they are in fact 164262306a36Sopenharmony_ci * never used uninitialized. 164362306a36Sopenharmony_ci */ 164462306a36Sopenharmony_ci int size0; 164562306a36Sopenharmony_ci u32 f0; 164662306a36Sopenharmony_ci int ind; 164762306a36Sopenharmony_ci u8 op0 = 0; 164862306a36Sopenharmony_ci 164962306a36Sopenharmony_ci spin_lock_irqsave(&qp->sq.lock, flags); 165062306a36Sopenharmony_ci 165162306a36Sopenharmony_ci /* XXX check that state is OK to post send */ 165262306a36Sopenharmony_ci 165362306a36Sopenharmony_ci ind = qp->sq.next_ind; 165462306a36Sopenharmony_ci 165562306a36Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 165662306a36Sopenharmony_ci if (mthca_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)) { 165762306a36Sopenharmony_ci mthca_err(dev, "SQ %06x full (%u head, %u tail," 165862306a36Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 165962306a36Sopenharmony_ci qp->sq.head, qp->sq.tail, 166062306a36Sopenharmony_ci qp->sq.max, nreq); 166162306a36Sopenharmony_ci err = -ENOMEM; 166262306a36Sopenharmony_ci *bad_wr = wr; 166362306a36Sopenharmony_ci goto out; 166462306a36Sopenharmony_ci } 166562306a36Sopenharmony_ci 166662306a36Sopenharmony_ci wqe = get_send_wqe(qp, ind); 166762306a36Sopenharmony_ci prev_wqe = qp->sq.last; 166862306a36Sopenharmony_ci qp->sq.last = wqe; 166962306a36Sopenharmony_ci 167062306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->nda_op = 0; 167162306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->ee_nds = 0; 167262306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 167362306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_SIGNALED) ? 167462306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_CQ_UPDATE) : 0) | 167562306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_SOLICITED) ? 167662306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_SOLICIT) : 0) | 167762306a36Sopenharmony_ci cpu_to_be32(1); 167862306a36Sopenharmony_ci if (wr->opcode == IB_WR_SEND_WITH_IMM || 167962306a36Sopenharmony_ci wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) 168062306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->imm = wr->ex.imm_data; 168162306a36Sopenharmony_ci 168262306a36Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 168362306a36Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 168462306a36Sopenharmony_ci 168562306a36Sopenharmony_ci switch (qp->transport) { 168662306a36Sopenharmony_ci case RC: 168762306a36Sopenharmony_ci switch (wr->opcode) { 168862306a36Sopenharmony_ci case IB_WR_ATOMIC_CMP_AND_SWP: 168962306a36Sopenharmony_ci case IB_WR_ATOMIC_FETCH_AND_ADD: 169062306a36Sopenharmony_ci set_raddr_seg(wqe, atomic_wr(wr)->remote_addr, 169162306a36Sopenharmony_ci atomic_wr(wr)->rkey); 169262306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 169362306a36Sopenharmony_ci 169462306a36Sopenharmony_ci set_atomic_seg(wqe, atomic_wr(wr)); 169562306a36Sopenharmony_ci wqe += sizeof (struct mthca_atomic_seg); 169662306a36Sopenharmony_ci size += (sizeof (struct mthca_raddr_seg) + 169762306a36Sopenharmony_ci sizeof (struct mthca_atomic_seg)) / 16; 169862306a36Sopenharmony_ci break; 169962306a36Sopenharmony_ci 170062306a36Sopenharmony_ci case IB_WR_RDMA_WRITE: 170162306a36Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 170262306a36Sopenharmony_ci case IB_WR_RDMA_READ: 170362306a36Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 170462306a36Sopenharmony_ci rdma_wr(wr)->rkey); 170562306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 170662306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 170762306a36Sopenharmony_ci break; 170862306a36Sopenharmony_ci 170962306a36Sopenharmony_ci default: 171062306a36Sopenharmony_ci /* No extra segments required for sends */ 171162306a36Sopenharmony_ci break; 171262306a36Sopenharmony_ci } 171362306a36Sopenharmony_ci 171462306a36Sopenharmony_ci break; 171562306a36Sopenharmony_ci 171662306a36Sopenharmony_ci case UC: 171762306a36Sopenharmony_ci switch (wr->opcode) { 171862306a36Sopenharmony_ci case IB_WR_RDMA_WRITE: 171962306a36Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 172062306a36Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 172162306a36Sopenharmony_ci rdma_wr(wr)->rkey); 172262306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 172362306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 172462306a36Sopenharmony_ci break; 172562306a36Sopenharmony_ci 172662306a36Sopenharmony_ci default: 172762306a36Sopenharmony_ci /* No extra segments required for sends */ 172862306a36Sopenharmony_ci break; 172962306a36Sopenharmony_ci } 173062306a36Sopenharmony_ci 173162306a36Sopenharmony_ci break; 173262306a36Sopenharmony_ci 173362306a36Sopenharmony_ci case UD: 173462306a36Sopenharmony_ci set_tavor_ud_seg(wqe, ud_wr(wr)); 173562306a36Sopenharmony_ci wqe += sizeof (struct mthca_tavor_ud_seg); 173662306a36Sopenharmony_ci size += sizeof (struct mthca_tavor_ud_seg) / 16; 173762306a36Sopenharmony_ci break; 173862306a36Sopenharmony_ci 173962306a36Sopenharmony_ci case MLX: 174062306a36Sopenharmony_ci err = build_mlx_header( 174162306a36Sopenharmony_ci dev, qp, ind, ud_wr(wr), 174262306a36Sopenharmony_ci wqe - sizeof(struct mthca_next_seg), wqe); 174362306a36Sopenharmony_ci if (err) { 174462306a36Sopenharmony_ci *bad_wr = wr; 174562306a36Sopenharmony_ci goto out; 174662306a36Sopenharmony_ci } 174762306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 174862306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 174962306a36Sopenharmony_ci break; 175062306a36Sopenharmony_ci } 175162306a36Sopenharmony_ci 175262306a36Sopenharmony_ci if (wr->num_sge > qp->sq.max_gs) { 175362306a36Sopenharmony_ci mthca_err(dev, "too many gathers\n"); 175462306a36Sopenharmony_ci err = -EINVAL; 175562306a36Sopenharmony_ci *bad_wr = wr; 175662306a36Sopenharmony_ci goto out; 175762306a36Sopenharmony_ci } 175862306a36Sopenharmony_ci 175962306a36Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 176062306a36Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 176162306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 176262306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 176362306a36Sopenharmony_ci } 176462306a36Sopenharmony_ci 176562306a36Sopenharmony_ci /* Add one more inline data segment for ICRC */ 176662306a36Sopenharmony_ci if (qp->transport == MLX) { 176762306a36Sopenharmony_ci ((struct mthca_data_seg *) wqe)->byte_count = 176862306a36Sopenharmony_ci cpu_to_be32((1 << 31) | 4); 176962306a36Sopenharmony_ci ((u32 *) wqe)[1] = 0; 177062306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 177162306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 177262306a36Sopenharmony_ci } 177362306a36Sopenharmony_ci 177462306a36Sopenharmony_ci qp->wrid[ind + qp->rq.max] = wr->wr_id; 177562306a36Sopenharmony_ci 177662306a36Sopenharmony_ci if (wr->opcode >= ARRAY_SIZE(mthca_opcode)) { 177762306a36Sopenharmony_ci mthca_err(dev, "opcode invalid\n"); 177862306a36Sopenharmony_ci err = -EINVAL; 177962306a36Sopenharmony_ci *bad_wr = wr; 178062306a36Sopenharmony_ci goto out; 178162306a36Sopenharmony_ci } 178262306a36Sopenharmony_ci 178362306a36Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->nda_op = 178462306a36Sopenharmony_ci cpu_to_be32(((ind << qp->sq.wqe_shift) + 178562306a36Sopenharmony_ci qp->send_wqe_offset) | 178662306a36Sopenharmony_ci mthca_opcode[wr->opcode]); 178762306a36Sopenharmony_ci wmb(); 178862306a36Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 178962306a36Sopenharmony_ci cpu_to_be32((nreq ? 0 : MTHCA_NEXT_DBD) | size | 179062306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_FENCE) ? 179162306a36Sopenharmony_ci MTHCA_NEXT_FENCE : 0)); 179262306a36Sopenharmony_ci 179362306a36Sopenharmony_ci if (!nreq) { 179462306a36Sopenharmony_ci size0 = size; 179562306a36Sopenharmony_ci op0 = mthca_opcode[wr->opcode]; 179662306a36Sopenharmony_ci f0 = wr->send_flags & IB_SEND_FENCE ? 179762306a36Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE : 0; 179862306a36Sopenharmony_ci } 179962306a36Sopenharmony_ci 180062306a36Sopenharmony_ci ++ind; 180162306a36Sopenharmony_ci if (unlikely(ind >= qp->sq.max)) 180262306a36Sopenharmony_ci ind -= qp->sq.max; 180362306a36Sopenharmony_ci } 180462306a36Sopenharmony_ci 180562306a36Sopenharmony_ciout: 180662306a36Sopenharmony_ci if (likely(nreq)) { 180762306a36Sopenharmony_ci wmb(); 180862306a36Sopenharmony_ci 180962306a36Sopenharmony_ci mthca_write64(((qp->sq.next_ind << qp->sq.wqe_shift) + 181062306a36Sopenharmony_ci qp->send_wqe_offset) | f0 | op0, 181162306a36Sopenharmony_ci (qp->qpn << 8) | size0, 181262306a36Sopenharmony_ci dev->kar + MTHCA_SEND_DOORBELL, 181362306a36Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 181462306a36Sopenharmony_ci } 181562306a36Sopenharmony_ci 181662306a36Sopenharmony_ci qp->sq.next_ind = ind; 181762306a36Sopenharmony_ci qp->sq.head += nreq; 181862306a36Sopenharmony_ci 181962306a36Sopenharmony_ci spin_unlock_irqrestore(&qp->sq.lock, flags); 182062306a36Sopenharmony_ci return err; 182162306a36Sopenharmony_ci} 182262306a36Sopenharmony_ci 182362306a36Sopenharmony_ciint mthca_tavor_post_receive(struct ib_qp *ibqp, const struct ib_recv_wr *wr, 182462306a36Sopenharmony_ci const struct ib_recv_wr **bad_wr) 182562306a36Sopenharmony_ci{ 182662306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 182762306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 182862306a36Sopenharmony_ci unsigned long flags; 182962306a36Sopenharmony_ci int err = 0; 183062306a36Sopenharmony_ci int nreq; 183162306a36Sopenharmony_ci int i; 183262306a36Sopenharmony_ci int size; 183362306a36Sopenharmony_ci /* 183462306a36Sopenharmony_ci * size0 is only used if nreq != 0, and it will always be 183562306a36Sopenharmony_ci * initialized the first time through the main loop before 183662306a36Sopenharmony_ci * nreq is incremented. So nreq cannot become non-zero 183762306a36Sopenharmony_ci * without initializing size0, and it is in fact never used 183862306a36Sopenharmony_ci * uninitialized. 183962306a36Sopenharmony_ci */ 184062306a36Sopenharmony_ci int size0; 184162306a36Sopenharmony_ci int ind; 184262306a36Sopenharmony_ci void *wqe; 184362306a36Sopenharmony_ci void *prev_wqe; 184462306a36Sopenharmony_ci 184562306a36Sopenharmony_ci spin_lock_irqsave(&qp->rq.lock, flags); 184662306a36Sopenharmony_ci 184762306a36Sopenharmony_ci /* XXX check that state is OK to post receive */ 184862306a36Sopenharmony_ci 184962306a36Sopenharmony_ci ind = qp->rq.next_ind; 185062306a36Sopenharmony_ci 185162306a36Sopenharmony_ci for (nreq = 0; wr; wr = wr->next) { 185262306a36Sopenharmony_ci if (mthca_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) { 185362306a36Sopenharmony_ci mthca_err(dev, "RQ %06x full (%u head, %u tail," 185462306a36Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 185562306a36Sopenharmony_ci qp->rq.head, qp->rq.tail, 185662306a36Sopenharmony_ci qp->rq.max, nreq); 185762306a36Sopenharmony_ci err = -ENOMEM; 185862306a36Sopenharmony_ci *bad_wr = wr; 185962306a36Sopenharmony_ci goto out; 186062306a36Sopenharmony_ci } 186162306a36Sopenharmony_ci 186262306a36Sopenharmony_ci wqe = get_recv_wqe(qp, ind); 186362306a36Sopenharmony_ci prev_wqe = qp->rq.last; 186462306a36Sopenharmony_ci qp->rq.last = wqe; 186562306a36Sopenharmony_ci 186662306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->ee_nds = 186762306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD); 186862306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 0; 186962306a36Sopenharmony_ci 187062306a36Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 187162306a36Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 187262306a36Sopenharmony_ci 187362306a36Sopenharmony_ci if (unlikely(wr->num_sge > qp->rq.max_gs)) { 187462306a36Sopenharmony_ci err = -EINVAL; 187562306a36Sopenharmony_ci *bad_wr = wr; 187662306a36Sopenharmony_ci goto out; 187762306a36Sopenharmony_ci } 187862306a36Sopenharmony_ci 187962306a36Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 188062306a36Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 188162306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 188262306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 188362306a36Sopenharmony_ci } 188462306a36Sopenharmony_ci 188562306a36Sopenharmony_ci qp->wrid[ind] = wr->wr_id; 188662306a36Sopenharmony_ci 188762306a36Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 188862306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD | size); 188962306a36Sopenharmony_ci 189062306a36Sopenharmony_ci if (!nreq) 189162306a36Sopenharmony_ci size0 = size; 189262306a36Sopenharmony_ci 189362306a36Sopenharmony_ci ++ind; 189462306a36Sopenharmony_ci if (unlikely(ind >= qp->rq.max)) 189562306a36Sopenharmony_ci ind -= qp->rq.max; 189662306a36Sopenharmony_ci 189762306a36Sopenharmony_ci ++nreq; 189862306a36Sopenharmony_ci if (unlikely(nreq == MTHCA_TAVOR_MAX_WQES_PER_RECV_DB)) { 189962306a36Sopenharmony_ci nreq = 0; 190062306a36Sopenharmony_ci 190162306a36Sopenharmony_ci wmb(); 190262306a36Sopenharmony_ci 190362306a36Sopenharmony_ci mthca_write64((qp->rq.next_ind << qp->rq.wqe_shift) | size0, 190462306a36Sopenharmony_ci qp->qpn << 8, dev->kar + MTHCA_RECEIVE_DOORBELL, 190562306a36Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 190662306a36Sopenharmony_ci 190762306a36Sopenharmony_ci qp->rq.next_ind = ind; 190862306a36Sopenharmony_ci qp->rq.head += MTHCA_TAVOR_MAX_WQES_PER_RECV_DB; 190962306a36Sopenharmony_ci } 191062306a36Sopenharmony_ci } 191162306a36Sopenharmony_ci 191262306a36Sopenharmony_ciout: 191362306a36Sopenharmony_ci if (likely(nreq)) { 191462306a36Sopenharmony_ci wmb(); 191562306a36Sopenharmony_ci 191662306a36Sopenharmony_ci mthca_write64((qp->rq.next_ind << qp->rq.wqe_shift) | size0, 191762306a36Sopenharmony_ci qp->qpn << 8 | nreq, dev->kar + MTHCA_RECEIVE_DOORBELL, 191862306a36Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 191962306a36Sopenharmony_ci } 192062306a36Sopenharmony_ci 192162306a36Sopenharmony_ci qp->rq.next_ind = ind; 192262306a36Sopenharmony_ci qp->rq.head += nreq; 192362306a36Sopenharmony_ci 192462306a36Sopenharmony_ci spin_unlock_irqrestore(&qp->rq.lock, flags); 192562306a36Sopenharmony_ci return err; 192662306a36Sopenharmony_ci} 192762306a36Sopenharmony_ci 192862306a36Sopenharmony_ciint mthca_arbel_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr, 192962306a36Sopenharmony_ci const struct ib_send_wr **bad_wr) 193062306a36Sopenharmony_ci{ 193162306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 193262306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 193362306a36Sopenharmony_ci u32 dbhi; 193462306a36Sopenharmony_ci void *wqe; 193562306a36Sopenharmony_ci void *prev_wqe; 193662306a36Sopenharmony_ci unsigned long flags; 193762306a36Sopenharmony_ci int err = 0; 193862306a36Sopenharmony_ci int nreq; 193962306a36Sopenharmony_ci int i; 194062306a36Sopenharmony_ci int size; 194162306a36Sopenharmony_ci /* 194262306a36Sopenharmony_ci * f0 and size0 are only used if nreq != 0, and they will 194362306a36Sopenharmony_ci * always be initialized the first time through the main loop 194462306a36Sopenharmony_ci * before nreq is incremented. So nreq cannot become non-zero 194562306a36Sopenharmony_ci * without initializing f0 and size0, and they are in fact 194662306a36Sopenharmony_ci * never used uninitialized. 194762306a36Sopenharmony_ci */ 194862306a36Sopenharmony_ci int size0; 194962306a36Sopenharmony_ci u32 f0; 195062306a36Sopenharmony_ci int ind; 195162306a36Sopenharmony_ci u8 op0 = 0; 195262306a36Sopenharmony_ci 195362306a36Sopenharmony_ci spin_lock_irqsave(&qp->sq.lock, flags); 195462306a36Sopenharmony_ci 195562306a36Sopenharmony_ci /* XXX check that state is OK to post send */ 195662306a36Sopenharmony_ci 195762306a36Sopenharmony_ci ind = qp->sq.head & (qp->sq.max - 1); 195862306a36Sopenharmony_ci 195962306a36Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 196062306a36Sopenharmony_ci if (unlikely(nreq == MTHCA_ARBEL_MAX_WQES_PER_SEND_DB)) { 196162306a36Sopenharmony_ci nreq = 0; 196262306a36Sopenharmony_ci 196362306a36Sopenharmony_ci dbhi = (MTHCA_ARBEL_MAX_WQES_PER_SEND_DB << 24) | 196462306a36Sopenharmony_ci ((qp->sq.head & 0xffff) << 8) | f0 | op0; 196562306a36Sopenharmony_ci 196662306a36Sopenharmony_ci qp->sq.head += MTHCA_ARBEL_MAX_WQES_PER_SEND_DB; 196762306a36Sopenharmony_ci 196862306a36Sopenharmony_ci /* 196962306a36Sopenharmony_ci * Make sure that descriptors are written before 197062306a36Sopenharmony_ci * doorbell record. 197162306a36Sopenharmony_ci */ 197262306a36Sopenharmony_ci wmb(); 197362306a36Sopenharmony_ci *qp->sq.db = cpu_to_be32(qp->sq.head & 0xffff); 197462306a36Sopenharmony_ci 197562306a36Sopenharmony_ci /* 197662306a36Sopenharmony_ci * Make sure doorbell record is written before we 197762306a36Sopenharmony_ci * write MMIO send doorbell. 197862306a36Sopenharmony_ci */ 197962306a36Sopenharmony_ci wmb(); 198062306a36Sopenharmony_ci 198162306a36Sopenharmony_ci mthca_write64(dbhi, (qp->qpn << 8) | size0, 198262306a36Sopenharmony_ci dev->kar + MTHCA_SEND_DOORBELL, 198362306a36Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 198462306a36Sopenharmony_ci } 198562306a36Sopenharmony_ci 198662306a36Sopenharmony_ci if (mthca_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)) { 198762306a36Sopenharmony_ci mthca_err(dev, "SQ %06x full (%u head, %u tail," 198862306a36Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 198962306a36Sopenharmony_ci qp->sq.head, qp->sq.tail, 199062306a36Sopenharmony_ci qp->sq.max, nreq); 199162306a36Sopenharmony_ci err = -ENOMEM; 199262306a36Sopenharmony_ci *bad_wr = wr; 199362306a36Sopenharmony_ci goto out; 199462306a36Sopenharmony_ci } 199562306a36Sopenharmony_ci 199662306a36Sopenharmony_ci wqe = get_send_wqe(qp, ind); 199762306a36Sopenharmony_ci prev_wqe = qp->sq.last; 199862306a36Sopenharmony_ci qp->sq.last = wqe; 199962306a36Sopenharmony_ci 200062306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 200162306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_SIGNALED) ? 200262306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_CQ_UPDATE) : 0) | 200362306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_SOLICITED) ? 200462306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_SOLICIT) : 0) | 200562306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_IP_CSUM) ? 200662306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_IP_CSUM | MTHCA_NEXT_TCP_UDP_CSUM) : 0) | 200762306a36Sopenharmony_ci cpu_to_be32(1); 200862306a36Sopenharmony_ci if (wr->opcode == IB_WR_SEND_WITH_IMM || 200962306a36Sopenharmony_ci wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) 201062306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->imm = wr->ex.imm_data; 201162306a36Sopenharmony_ci 201262306a36Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 201362306a36Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 201462306a36Sopenharmony_ci 201562306a36Sopenharmony_ci switch (qp->transport) { 201662306a36Sopenharmony_ci case RC: 201762306a36Sopenharmony_ci switch (wr->opcode) { 201862306a36Sopenharmony_ci case IB_WR_ATOMIC_CMP_AND_SWP: 201962306a36Sopenharmony_ci case IB_WR_ATOMIC_FETCH_AND_ADD: 202062306a36Sopenharmony_ci set_raddr_seg(wqe, atomic_wr(wr)->remote_addr, 202162306a36Sopenharmony_ci atomic_wr(wr)->rkey); 202262306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 202362306a36Sopenharmony_ci 202462306a36Sopenharmony_ci set_atomic_seg(wqe, atomic_wr(wr)); 202562306a36Sopenharmony_ci wqe += sizeof (struct mthca_atomic_seg); 202662306a36Sopenharmony_ci size += (sizeof (struct mthca_raddr_seg) + 202762306a36Sopenharmony_ci sizeof (struct mthca_atomic_seg)) / 16; 202862306a36Sopenharmony_ci break; 202962306a36Sopenharmony_ci 203062306a36Sopenharmony_ci case IB_WR_RDMA_READ: 203162306a36Sopenharmony_ci case IB_WR_RDMA_WRITE: 203262306a36Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 203362306a36Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 203462306a36Sopenharmony_ci rdma_wr(wr)->rkey); 203562306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 203662306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 203762306a36Sopenharmony_ci break; 203862306a36Sopenharmony_ci 203962306a36Sopenharmony_ci default: 204062306a36Sopenharmony_ci /* No extra segments required for sends */ 204162306a36Sopenharmony_ci break; 204262306a36Sopenharmony_ci } 204362306a36Sopenharmony_ci 204462306a36Sopenharmony_ci break; 204562306a36Sopenharmony_ci 204662306a36Sopenharmony_ci case UC: 204762306a36Sopenharmony_ci switch (wr->opcode) { 204862306a36Sopenharmony_ci case IB_WR_RDMA_WRITE: 204962306a36Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 205062306a36Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 205162306a36Sopenharmony_ci rdma_wr(wr)->rkey); 205262306a36Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 205362306a36Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 205462306a36Sopenharmony_ci break; 205562306a36Sopenharmony_ci 205662306a36Sopenharmony_ci default: 205762306a36Sopenharmony_ci /* No extra segments required for sends */ 205862306a36Sopenharmony_ci break; 205962306a36Sopenharmony_ci } 206062306a36Sopenharmony_ci 206162306a36Sopenharmony_ci break; 206262306a36Sopenharmony_ci 206362306a36Sopenharmony_ci case UD: 206462306a36Sopenharmony_ci set_arbel_ud_seg(wqe, ud_wr(wr)); 206562306a36Sopenharmony_ci wqe += sizeof (struct mthca_arbel_ud_seg); 206662306a36Sopenharmony_ci size += sizeof (struct mthca_arbel_ud_seg) / 16; 206762306a36Sopenharmony_ci break; 206862306a36Sopenharmony_ci 206962306a36Sopenharmony_ci case MLX: 207062306a36Sopenharmony_ci err = build_mlx_header( 207162306a36Sopenharmony_ci dev, qp, ind, ud_wr(wr), 207262306a36Sopenharmony_ci wqe - sizeof(struct mthca_next_seg), wqe); 207362306a36Sopenharmony_ci if (err) { 207462306a36Sopenharmony_ci *bad_wr = wr; 207562306a36Sopenharmony_ci goto out; 207662306a36Sopenharmony_ci } 207762306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 207862306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 207962306a36Sopenharmony_ci break; 208062306a36Sopenharmony_ci } 208162306a36Sopenharmony_ci 208262306a36Sopenharmony_ci if (wr->num_sge > qp->sq.max_gs) { 208362306a36Sopenharmony_ci mthca_err(dev, "too many gathers\n"); 208462306a36Sopenharmony_ci err = -EINVAL; 208562306a36Sopenharmony_ci *bad_wr = wr; 208662306a36Sopenharmony_ci goto out; 208762306a36Sopenharmony_ci } 208862306a36Sopenharmony_ci 208962306a36Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 209062306a36Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 209162306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 209262306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 209362306a36Sopenharmony_ci } 209462306a36Sopenharmony_ci 209562306a36Sopenharmony_ci /* Add one more inline data segment for ICRC */ 209662306a36Sopenharmony_ci if (qp->transport == MLX) { 209762306a36Sopenharmony_ci ((struct mthca_data_seg *) wqe)->byte_count = 209862306a36Sopenharmony_ci cpu_to_be32((1 << 31) | 4); 209962306a36Sopenharmony_ci ((u32 *) wqe)[1] = 0; 210062306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 210162306a36Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 210262306a36Sopenharmony_ci } 210362306a36Sopenharmony_ci 210462306a36Sopenharmony_ci qp->wrid[ind + qp->rq.max] = wr->wr_id; 210562306a36Sopenharmony_ci 210662306a36Sopenharmony_ci if (wr->opcode >= ARRAY_SIZE(mthca_opcode)) { 210762306a36Sopenharmony_ci mthca_err(dev, "opcode invalid\n"); 210862306a36Sopenharmony_ci err = -EINVAL; 210962306a36Sopenharmony_ci *bad_wr = wr; 211062306a36Sopenharmony_ci goto out; 211162306a36Sopenharmony_ci } 211262306a36Sopenharmony_ci 211362306a36Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->nda_op = 211462306a36Sopenharmony_ci cpu_to_be32(((ind << qp->sq.wqe_shift) + 211562306a36Sopenharmony_ci qp->send_wqe_offset) | 211662306a36Sopenharmony_ci mthca_opcode[wr->opcode]); 211762306a36Sopenharmony_ci wmb(); 211862306a36Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 211962306a36Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD | size | 212062306a36Sopenharmony_ci ((wr->send_flags & IB_SEND_FENCE) ? 212162306a36Sopenharmony_ci MTHCA_NEXT_FENCE : 0)); 212262306a36Sopenharmony_ci 212362306a36Sopenharmony_ci if (!nreq) { 212462306a36Sopenharmony_ci size0 = size; 212562306a36Sopenharmony_ci op0 = mthca_opcode[wr->opcode]; 212662306a36Sopenharmony_ci f0 = wr->send_flags & IB_SEND_FENCE ? 212762306a36Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE : 0; 212862306a36Sopenharmony_ci } 212962306a36Sopenharmony_ci 213062306a36Sopenharmony_ci ++ind; 213162306a36Sopenharmony_ci if (unlikely(ind >= qp->sq.max)) 213262306a36Sopenharmony_ci ind -= qp->sq.max; 213362306a36Sopenharmony_ci } 213462306a36Sopenharmony_ci 213562306a36Sopenharmony_ciout: 213662306a36Sopenharmony_ci if (likely(nreq)) { 213762306a36Sopenharmony_ci dbhi = (nreq << 24) | ((qp->sq.head & 0xffff) << 8) | f0 | op0; 213862306a36Sopenharmony_ci 213962306a36Sopenharmony_ci qp->sq.head += nreq; 214062306a36Sopenharmony_ci 214162306a36Sopenharmony_ci /* 214262306a36Sopenharmony_ci * Make sure that descriptors are written before 214362306a36Sopenharmony_ci * doorbell record. 214462306a36Sopenharmony_ci */ 214562306a36Sopenharmony_ci wmb(); 214662306a36Sopenharmony_ci *qp->sq.db = cpu_to_be32(qp->sq.head & 0xffff); 214762306a36Sopenharmony_ci 214862306a36Sopenharmony_ci /* 214962306a36Sopenharmony_ci * Make sure doorbell record is written before we 215062306a36Sopenharmony_ci * write MMIO send doorbell. 215162306a36Sopenharmony_ci */ 215262306a36Sopenharmony_ci wmb(); 215362306a36Sopenharmony_ci 215462306a36Sopenharmony_ci mthca_write64(dbhi, (qp->qpn << 8) | size0, dev->kar + MTHCA_SEND_DOORBELL, 215562306a36Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 215662306a36Sopenharmony_ci } 215762306a36Sopenharmony_ci 215862306a36Sopenharmony_ci spin_unlock_irqrestore(&qp->sq.lock, flags); 215962306a36Sopenharmony_ci return err; 216062306a36Sopenharmony_ci} 216162306a36Sopenharmony_ci 216262306a36Sopenharmony_ciint mthca_arbel_post_receive(struct ib_qp *ibqp, const struct ib_recv_wr *wr, 216362306a36Sopenharmony_ci const struct ib_recv_wr **bad_wr) 216462306a36Sopenharmony_ci{ 216562306a36Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 216662306a36Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 216762306a36Sopenharmony_ci unsigned long flags; 216862306a36Sopenharmony_ci int err = 0; 216962306a36Sopenharmony_ci int nreq; 217062306a36Sopenharmony_ci int ind; 217162306a36Sopenharmony_ci int i; 217262306a36Sopenharmony_ci void *wqe; 217362306a36Sopenharmony_ci 217462306a36Sopenharmony_ci spin_lock_irqsave(&qp->rq.lock, flags); 217562306a36Sopenharmony_ci 217662306a36Sopenharmony_ci /* XXX check that state is OK to post receive */ 217762306a36Sopenharmony_ci 217862306a36Sopenharmony_ci ind = qp->rq.head & (qp->rq.max - 1); 217962306a36Sopenharmony_ci 218062306a36Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 218162306a36Sopenharmony_ci if (mthca_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) { 218262306a36Sopenharmony_ci mthca_err(dev, "RQ %06x full (%u head, %u tail," 218362306a36Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 218462306a36Sopenharmony_ci qp->rq.head, qp->rq.tail, 218562306a36Sopenharmony_ci qp->rq.max, nreq); 218662306a36Sopenharmony_ci err = -ENOMEM; 218762306a36Sopenharmony_ci *bad_wr = wr; 218862306a36Sopenharmony_ci goto out; 218962306a36Sopenharmony_ci } 219062306a36Sopenharmony_ci 219162306a36Sopenharmony_ci wqe = get_recv_wqe(qp, ind); 219262306a36Sopenharmony_ci 219362306a36Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 0; 219462306a36Sopenharmony_ci 219562306a36Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 219662306a36Sopenharmony_ci 219762306a36Sopenharmony_ci if (unlikely(wr->num_sge > qp->rq.max_gs)) { 219862306a36Sopenharmony_ci err = -EINVAL; 219962306a36Sopenharmony_ci *bad_wr = wr; 220062306a36Sopenharmony_ci goto out; 220162306a36Sopenharmony_ci } 220262306a36Sopenharmony_ci 220362306a36Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 220462306a36Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 220562306a36Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 220662306a36Sopenharmony_ci } 220762306a36Sopenharmony_ci 220862306a36Sopenharmony_ci if (i < qp->rq.max_gs) 220962306a36Sopenharmony_ci mthca_set_data_seg_inval(wqe); 221062306a36Sopenharmony_ci 221162306a36Sopenharmony_ci qp->wrid[ind] = wr->wr_id; 221262306a36Sopenharmony_ci 221362306a36Sopenharmony_ci ++ind; 221462306a36Sopenharmony_ci if (unlikely(ind >= qp->rq.max)) 221562306a36Sopenharmony_ci ind -= qp->rq.max; 221662306a36Sopenharmony_ci } 221762306a36Sopenharmony_ciout: 221862306a36Sopenharmony_ci if (likely(nreq)) { 221962306a36Sopenharmony_ci qp->rq.head += nreq; 222062306a36Sopenharmony_ci 222162306a36Sopenharmony_ci /* 222262306a36Sopenharmony_ci * Make sure that descriptors are written before 222362306a36Sopenharmony_ci * doorbell record. 222462306a36Sopenharmony_ci */ 222562306a36Sopenharmony_ci wmb(); 222662306a36Sopenharmony_ci *qp->rq.db = cpu_to_be32(qp->rq.head & 0xffff); 222762306a36Sopenharmony_ci } 222862306a36Sopenharmony_ci 222962306a36Sopenharmony_ci spin_unlock_irqrestore(&qp->rq.lock, flags); 223062306a36Sopenharmony_ci return err; 223162306a36Sopenharmony_ci} 223262306a36Sopenharmony_ci 223362306a36Sopenharmony_civoid mthca_free_err_wqe(struct mthca_dev *dev, struct mthca_qp *qp, int is_send, 223462306a36Sopenharmony_ci int index, int *dbd, __be32 *new_wqe) 223562306a36Sopenharmony_ci{ 223662306a36Sopenharmony_ci struct mthca_next_seg *next; 223762306a36Sopenharmony_ci 223862306a36Sopenharmony_ci /* 223962306a36Sopenharmony_ci * For SRQs, all receive WQEs generate a CQE, so we're always 224062306a36Sopenharmony_ci * at the end of the doorbell chain. 224162306a36Sopenharmony_ci */ 224262306a36Sopenharmony_ci if (qp->ibqp.srq && !is_send) { 224362306a36Sopenharmony_ci *new_wqe = 0; 224462306a36Sopenharmony_ci return; 224562306a36Sopenharmony_ci } 224662306a36Sopenharmony_ci 224762306a36Sopenharmony_ci if (is_send) 224862306a36Sopenharmony_ci next = get_send_wqe(qp, index); 224962306a36Sopenharmony_ci else 225062306a36Sopenharmony_ci next = get_recv_wqe(qp, index); 225162306a36Sopenharmony_ci 225262306a36Sopenharmony_ci *dbd = !!(next->ee_nds & cpu_to_be32(MTHCA_NEXT_DBD)); 225362306a36Sopenharmony_ci if (next->ee_nds & cpu_to_be32(0x3f)) 225462306a36Sopenharmony_ci *new_wqe = (next->nda_op & cpu_to_be32(~0x3f)) | 225562306a36Sopenharmony_ci (next->ee_nds & cpu_to_be32(0x3f)); 225662306a36Sopenharmony_ci else 225762306a36Sopenharmony_ci *new_wqe = 0; 225862306a36Sopenharmony_ci} 225962306a36Sopenharmony_ci 226062306a36Sopenharmony_ciint mthca_init_qp_table(struct mthca_dev *dev) 226162306a36Sopenharmony_ci{ 226262306a36Sopenharmony_ci int err; 226362306a36Sopenharmony_ci int i; 226462306a36Sopenharmony_ci 226562306a36Sopenharmony_ci spin_lock_init(&dev->qp_table.lock); 226662306a36Sopenharmony_ci 226762306a36Sopenharmony_ci /* 226862306a36Sopenharmony_ci * We reserve 2 extra QPs per port for the special QPs. The 226962306a36Sopenharmony_ci * special QP for port 1 has to be even, so round up. 227062306a36Sopenharmony_ci */ 227162306a36Sopenharmony_ci dev->qp_table.sqp_start = (dev->limits.reserved_qps + 1) & ~1UL; 227262306a36Sopenharmony_ci err = mthca_alloc_init(&dev->qp_table.alloc, 227362306a36Sopenharmony_ci dev->limits.num_qps, 227462306a36Sopenharmony_ci (1 << 24) - 1, 227562306a36Sopenharmony_ci dev->qp_table.sqp_start + 227662306a36Sopenharmony_ci MTHCA_MAX_PORTS * 2); 227762306a36Sopenharmony_ci if (err) 227862306a36Sopenharmony_ci return err; 227962306a36Sopenharmony_ci 228062306a36Sopenharmony_ci err = mthca_array_init(&dev->qp_table.qp, 228162306a36Sopenharmony_ci dev->limits.num_qps); 228262306a36Sopenharmony_ci if (err) { 228362306a36Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 228462306a36Sopenharmony_ci return err; 228562306a36Sopenharmony_ci } 228662306a36Sopenharmony_ci 228762306a36Sopenharmony_ci for (i = 0; i < 2; ++i) { 228862306a36Sopenharmony_ci err = mthca_CONF_SPECIAL_QP(dev, i ? IB_QPT_GSI : IB_QPT_SMI, 228962306a36Sopenharmony_ci dev->qp_table.sqp_start + i * 2); 229062306a36Sopenharmony_ci if (err) { 229162306a36Sopenharmony_ci mthca_warn(dev, "CONF_SPECIAL_QP returned " 229262306a36Sopenharmony_ci "%d, aborting.\n", err); 229362306a36Sopenharmony_ci goto err_out; 229462306a36Sopenharmony_ci } 229562306a36Sopenharmony_ci } 229662306a36Sopenharmony_ci return 0; 229762306a36Sopenharmony_ci 229862306a36Sopenharmony_ci err_out: 229962306a36Sopenharmony_ci for (i = 0; i < 2; ++i) 230062306a36Sopenharmony_ci mthca_CONF_SPECIAL_QP(dev, i, 0); 230162306a36Sopenharmony_ci 230262306a36Sopenharmony_ci mthca_array_cleanup(&dev->qp_table.qp, dev->limits.num_qps); 230362306a36Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 230462306a36Sopenharmony_ci 230562306a36Sopenharmony_ci return err; 230662306a36Sopenharmony_ci} 230762306a36Sopenharmony_ci 230862306a36Sopenharmony_civoid mthca_cleanup_qp_table(struct mthca_dev *dev) 230962306a36Sopenharmony_ci{ 231062306a36Sopenharmony_ci int i; 231162306a36Sopenharmony_ci 231262306a36Sopenharmony_ci for (i = 0; i < 2; ++i) 231362306a36Sopenharmony_ci mthca_CONF_SPECIAL_QP(dev, i, 0); 231462306a36Sopenharmony_ci 231562306a36Sopenharmony_ci mthca_array_cleanup(&dev->qp_table.qp, dev->limits.num_qps); 231662306a36Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 231762306a36Sopenharmony_ci} 2318