18c2ecf20Sopenharmony_ci/* 28c2ecf20Sopenharmony_ci * Copyright (c) 2004 Topspin Communications. All rights reserved. 38c2ecf20Sopenharmony_ci * Copyright (c) 2005 Cisco Systems. All rights reserved. 48c2ecf20Sopenharmony_ci * Copyright (c) 2005 Mellanox Technologies. All rights reserved. 58c2ecf20Sopenharmony_ci * Copyright (c) 2004 Voltaire, Inc. All rights reserved. 68c2ecf20Sopenharmony_ci * 78c2ecf20Sopenharmony_ci * This software is available to you under a choice of one of two 88c2ecf20Sopenharmony_ci * licenses. You may choose to be licensed under the terms of the GNU 98c2ecf20Sopenharmony_ci * General Public License (GPL) Version 2, available from the file 108c2ecf20Sopenharmony_ci * COPYING in the main directory of this source tree, or the 118c2ecf20Sopenharmony_ci * OpenIB.org BSD license below: 128c2ecf20Sopenharmony_ci * 138c2ecf20Sopenharmony_ci * Redistribution and use in source and binary forms, with or 148c2ecf20Sopenharmony_ci * without modification, are permitted provided that the following 158c2ecf20Sopenharmony_ci * conditions are met: 168c2ecf20Sopenharmony_ci * 178c2ecf20Sopenharmony_ci * - Redistributions of source code must retain the above 188c2ecf20Sopenharmony_ci * copyright notice, this list of conditions and the following 198c2ecf20Sopenharmony_ci * disclaimer. 208c2ecf20Sopenharmony_ci * 218c2ecf20Sopenharmony_ci * - Redistributions in binary form must reproduce the above 228c2ecf20Sopenharmony_ci * copyright notice, this list of conditions and the following 238c2ecf20Sopenharmony_ci * disclaimer in the documentation and/or other materials 248c2ecf20Sopenharmony_ci * provided with the distribution. 258c2ecf20Sopenharmony_ci * 268c2ecf20Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 278c2ecf20Sopenharmony_ci * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 288c2ecf20Sopenharmony_ci * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 298c2ecf20Sopenharmony_ci * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 308c2ecf20Sopenharmony_ci * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 318c2ecf20Sopenharmony_ci * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 328c2ecf20Sopenharmony_ci * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 338c2ecf20Sopenharmony_ci * SOFTWARE. 348c2ecf20Sopenharmony_ci */ 358c2ecf20Sopenharmony_ci 368c2ecf20Sopenharmony_ci#include <linux/string.h> 378c2ecf20Sopenharmony_ci#include <linux/slab.h> 388c2ecf20Sopenharmony_ci#include <linux/sched.h> 398c2ecf20Sopenharmony_ci 408c2ecf20Sopenharmony_ci#include <asm/io.h> 418c2ecf20Sopenharmony_ci 428c2ecf20Sopenharmony_ci#include <rdma/ib_verbs.h> 438c2ecf20Sopenharmony_ci#include <rdma/ib_cache.h> 448c2ecf20Sopenharmony_ci#include <rdma/ib_pack.h> 458c2ecf20Sopenharmony_ci#include <rdma/uverbs_ioctl.h> 468c2ecf20Sopenharmony_ci 478c2ecf20Sopenharmony_ci#include "mthca_dev.h" 488c2ecf20Sopenharmony_ci#include "mthca_cmd.h" 498c2ecf20Sopenharmony_ci#include "mthca_memfree.h" 508c2ecf20Sopenharmony_ci#include "mthca_wqe.h" 518c2ecf20Sopenharmony_ci 528c2ecf20Sopenharmony_cienum { 538c2ecf20Sopenharmony_ci MTHCA_MAX_DIRECT_QP_SIZE = 4 * PAGE_SIZE, 548c2ecf20Sopenharmony_ci MTHCA_ACK_REQ_FREQ = 10, 558c2ecf20Sopenharmony_ci MTHCA_FLIGHT_LIMIT = 9, 568c2ecf20Sopenharmony_ci MTHCA_UD_HEADER_SIZE = 72, /* largest UD header possible */ 578c2ecf20Sopenharmony_ci MTHCA_INLINE_HEADER_SIZE = 4, /* data segment overhead for inline */ 588c2ecf20Sopenharmony_ci MTHCA_INLINE_CHUNK_SIZE = 16 /* inline data segment chunk */ 598c2ecf20Sopenharmony_ci}; 608c2ecf20Sopenharmony_ci 618c2ecf20Sopenharmony_cienum { 628c2ecf20Sopenharmony_ci MTHCA_QP_STATE_RST = 0, 638c2ecf20Sopenharmony_ci MTHCA_QP_STATE_INIT = 1, 648c2ecf20Sopenharmony_ci MTHCA_QP_STATE_RTR = 2, 658c2ecf20Sopenharmony_ci MTHCA_QP_STATE_RTS = 3, 668c2ecf20Sopenharmony_ci MTHCA_QP_STATE_SQE = 4, 678c2ecf20Sopenharmony_ci MTHCA_QP_STATE_SQD = 5, 688c2ecf20Sopenharmony_ci MTHCA_QP_STATE_ERR = 6, 698c2ecf20Sopenharmony_ci MTHCA_QP_STATE_DRAINING = 7 708c2ecf20Sopenharmony_ci}; 718c2ecf20Sopenharmony_ci 728c2ecf20Sopenharmony_cienum { 738c2ecf20Sopenharmony_ci MTHCA_QP_ST_RC = 0x0, 748c2ecf20Sopenharmony_ci MTHCA_QP_ST_UC = 0x1, 758c2ecf20Sopenharmony_ci MTHCA_QP_ST_RD = 0x2, 768c2ecf20Sopenharmony_ci MTHCA_QP_ST_UD = 0x3, 778c2ecf20Sopenharmony_ci MTHCA_QP_ST_MLX = 0x7 788c2ecf20Sopenharmony_ci}; 798c2ecf20Sopenharmony_ci 808c2ecf20Sopenharmony_cienum { 818c2ecf20Sopenharmony_ci MTHCA_QP_PM_MIGRATED = 0x3, 828c2ecf20Sopenharmony_ci MTHCA_QP_PM_ARMED = 0x0, 838c2ecf20Sopenharmony_ci MTHCA_QP_PM_REARM = 0x1 848c2ecf20Sopenharmony_ci}; 858c2ecf20Sopenharmony_ci 868c2ecf20Sopenharmony_cienum { 878c2ecf20Sopenharmony_ci /* qp_context flags */ 888c2ecf20Sopenharmony_ci MTHCA_QP_BIT_DE = 1 << 8, 898c2ecf20Sopenharmony_ci /* params1 */ 908c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SRE = 1 << 15, 918c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SWE = 1 << 14, 928c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SAE = 1 << 13, 938c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SIC = 1 << 4, 948c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SSC = 1 << 3, 958c2ecf20Sopenharmony_ci /* params2 */ 968c2ecf20Sopenharmony_ci MTHCA_QP_BIT_RRE = 1 << 15, 978c2ecf20Sopenharmony_ci MTHCA_QP_BIT_RWE = 1 << 14, 988c2ecf20Sopenharmony_ci MTHCA_QP_BIT_RAE = 1 << 13, 998c2ecf20Sopenharmony_ci MTHCA_QP_BIT_RIC = 1 << 4, 1008c2ecf20Sopenharmony_ci MTHCA_QP_BIT_RSC = 1 << 3 1018c2ecf20Sopenharmony_ci}; 1028c2ecf20Sopenharmony_ci 1038c2ecf20Sopenharmony_cienum { 1048c2ecf20Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE = 1 << 5 1058c2ecf20Sopenharmony_ci}; 1068c2ecf20Sopenharmony_ci 1078c2ecf20Sopenharmony_cistruct mthca_qp_path { 1088c2ecf20Sopenharmony_ci __be32 port_pkey; 1098c2ecf20Sopenharmony_ci u8 rnr_retry; 1108c2ecf20Sopenharmony_ci u8 g_mylmc; 1118c2ecf20Sopenharmony_ci __be16 rlid; 1128c2ecf20Sopenharmony_ci u8 ackto; 1138c2ecf20Sopenharmony_ci u8 mgid_index; 1148c2ecf20Sopenharmony_ci u8 static_rate; 1158c2ecf20Sopenharmony_ci u8 hop_limit; 1168c2ecf20Sopenharmony_ci __be32 sl_tclass_flowlabel; 1178c2ecf20Sopenharmony_ci u8 rgid[16]; 1188c2ecf20Sopenharmony_ci} __packed; 1198c2ecf20Sopenharmony_ci 1208c2ecf20Sopenharmony_cistruct mthca_qp_context { 1218c2ecf20Sopenharmony_ci __be32 flags; 1228c2ecf20Sopenharmony_ci __be32 tavor_sched_queue; /* Reserved on Arbel */ 1238c2ecf20Sopenharmony_ci u8 mtu_msgmax; 1248c2ecf20Sopenharmony_ci u8 rq_size_stride; /* Reserved on Tavor */ 1258c2ecf20Sopenharmony_ci u8 sq_size_stride; /* Reserved on Tavor */ 1268c2ecf20Sopenharmony_ci u8 rlkey_arbel_sched_queue; /* Reserved on Tavor */ 1278c2ecf20Sopenharmony_ci __be32 usr_page; 1288c2ecf20Sopenharmony_ci __be32 local_qpn; 1298c2ecf20Sopenharmony_ci __be32 remote_qpn; 1308c2ecf20Sopenharmony_ci u32 reserved1[2]; 1318c2ecf20Sopenharmony_ci struct mthca_qp_path pri_path; 1328c2ecf20Sopenharmony_ci struct mthca_qp_path alt_path; 1338c2ecf20Sopenharmony_ci __be32 rdd; 1348c2ecf20Sopenharmony_ci __be32 pd; 1358c2ecf20Sopenharmony_ci __be32 wqe_base; 1368c2ecf20Sopenharmony_ci __be32 wqe_lkey; 1378c2ecf20Sopenharmony_ci __be32 params1; 1388c2ecf20Sopenharmony_ci __be32 reserved2; 1398c2ecf20Sopenharmony_ci __be32 next_send_psn; 1408c2ecf20Sopenharmony_ci __be32 cqn_snd; 1418c2ecf20Sopenharmony_ci __be32 snd_wqe_base_l; /* Next send WQE on Tavor */ 1428c2ecf20Sopenharmony_ci __be32 snd_db_index; /* (debugging only entries) */ 1438c2ecf20Sopenharmony_ci __be32 last_acked_psn; 1448c2ecf20Sopenharmony_ci __be32 ssn; 1458c2ecf20Sopenharmony_ci __be32 params2; 1468c2ecf20Sopenharmony_ci __be32 rnr_nextrecvpsn; 1478c2ecf20Sopenharmony_ci __be32 ra_buff_indx; 1488c2ecf20Sopenharmony_ci __be32 cqn_rcv; 1498c2ecf20Sopenharmony_ci __be32 rcv_wqe_base_l; /* Next recv WQE on Tavor */ 1508c2ecf20Sopenharmony_ci __be32 rcv_db_index; /* (debugging only entries) */ 1518c2ecf20Sopenharmony_ci __be32 qkey; 1528c2ecf20Sopenharmony_ci __be32 srqn; 1538c2ecf20Sopenharmony_ci __be32 rmsn; 1548c2ecf20Sopenharmony_ci __be16 rq_wqe_counter; /* reserved on Tavor */ 1558c2ecf20Sopenharmony_ci __be16 sq_wqe_counter; /* reserved on Tavor */ 1568c2ecf20Sopenharmony_ci u32 reserved3[18]; 1578c2ecf20Sopenharmony_ci} __packed; 1588c2ecf20Sopenharmony_ci 1598c2ecf20Sopenharmony_cistruct mthca_qp_param { 1608c2ecf20Sopenharmony_ci __be32 opt_param_mask; 1618c2ecf20Sopenharmony_ci u32 reserved1; 1628c2ecf20Sopenharmony_ci struct mthca_qp_context context; 1638c2ecf20Sopenharmony_ci u32 reserved2[62]; 1648c2ecf20Sopenharmony_ci} __packed; 1658c2ecf20Sopenharmony_ci 1668c2ecf20Sopenharmony_cienum { 1678c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_ADDR_PATH = 1 << 0, 1688c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RRE = 1 << 1, 1698c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RAE = 1 << 2, 1708c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RWE = 1 << 3, 1718c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_PKEY_INDEX = 1 << 4, 1728c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_Q_KEY = 1 << 5, 1738c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RNR_TIMEOUT = 1 << 6, 1748c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_PRIMARY_ADDR_PATH = 1 << 7, 1758c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_SRA_MAX = 1 << 8, 1768c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RRA_MAX = 1 << 9, 1778c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_PM_STATE = 1 << 10, 1788c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_PORT_NUM = 1 << 11, 1798c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RETRY_COUNT = 1 << 12, 1808c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_RNR_RETRY = 1 << 13, 1818c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_ACK_TIMEOUT = 1 << 14, 1828c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RNR_RETRY = 1 << 15, 1838c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_SCHED_QUEUE = 1 << 16 1848c2ecf20Sopenharmony_ci}; 1858c2ecf20Sopenharmony_ci 1868c2ecf20Sopenharmony_cistatic const u8 mthca_opcode[] = { 1878c2ecf20Sopenharmony_ci [IB_WR_SEND] = MTHCA_OPCODE_SEND, 1888c2ecf20Sopenharmony_ci [IB_WR_SEND_WITH_IMM] = MTHCA_OPCODE_SEND_IMM, 1898c2ecf20Sopenharmony_ci [IB_WR_RDMA_WRITE] = MTHCA_OPCODE_RDMA_WRITE, 1908c2ecf20Sopenharmony_ci [IB_WR_RDMA_WRITE_WITH_IMM] = MTHCA_OPCODE_RDMA_WRITE_IMM, 1918c2ecf20Sopenharmony_ci [IB_WR_RDMA_READ] = MTHCA_OPCODE_RDMA_READ, 1928c2ecf20Sopenharmony_ci [IB_WR_ATOMIC_CMP_AND_SWP] = MTHCA_OPCODE_ATOMIC_CS, 1938c2ecf20Sopenharmony_ci [IB_WR_ATOMIC_FETCH_AND_ADD] = MTHCA_OPCODE_ATOMIC_FA, 1948c2ecf20Sopenharmony_ci}; 1958c2ecf20Sopenharmony_ci 1968c2ecf20Sopenharmony_cistatic int is_sqp(struct mthca_dev *dev, struct mthca_qp *qp) 1978c2ecf20Sopenharmony_ci{ 1988c2ecf20Sopenharmony_ci return qp->qpn >= dev->qp_table.sqp_start && 1998c2ecf20Sopenharmony_ci qp->qpn <= dev->qp_table.sqp_start + 3; 2008c2ecf20Sopenharmony_ci} 2018c2ecf20Sopenharmony_ci 2028c2ecf20Sopenharmony_cistatic int is_qp0(struct mthca_dev *dev, struct mthca_qp *qp) 2038c2ecf20Sopenharmony_ci{ 2048c2ecf20Sopenharmony_ci return qp->qpn >= dev->qp_table.sqp_start && 2058c2ecf20Sopenharmony_ci qp->qpn <= dev->qp_table.sqp_start + 1; 2068c2ecf20Sopenharmony_ci} 2078c2ecf20Sopenharmony_ci 2088c2ecf20Sopenharmony_cistatic void *get_recv_wqe(struct mthca_qp *qp, int n) 2098c2ecf20Sopenharmony_ci{ 2108c2ecf20Sopenharmony_ci if (qp->is_direct) 2118c2ecf20Sopenharmony_ci return qp->queue.direct.buf + (n << qp->rq.wqe_shift); 2128c2ecf20Sopenharmony_ci else 2138c2ecf20Sopenharmony_ci return qp->queue.page_list[(n << qp->rq.wqe_shift) >> PAGE_SHIFT].buf + 2148c2ecf20Sopenharmony_ci ((n << qp->rq.wqe_shift) & (PAGE_SIZE - 1)); 2158c2ecf20Sopenharmony_ci} 2168c2ecf20Sopenharmony_ci 2178c2ecf20Sopenharmony_cistatic void *get_send_wqe(struct mthca_qp *qp, int n) 2188c2ecf20Sopenharmony_ci{ 2198c2ecf20Sopenharmony_ci if (qp->is_direct) 2208c2ecf20Sopenharmony_ci return qp->queue.direct.buf + qp->send_wqe_offset + 2218c2ecf20Sopenharmony_ci (n << qp->sq.wqe_shift); 2228c2ecf20Sopenharmony_ci else 2238c2ecf20Sopenharmony_ci return qp->queue.page_list[(qp->send_wqe_offset + 2248c2ecf20Sopenharmony_ci (n << qp->sq.wqe_shift)) >> 2258c2ecf20Sopenharmony_ci PAGE_SHIFT].buf + 2268c2ecf20Sopenharmony_ci ((qp->send_wqe_offset + (n << qp->sq.wqe_shift)) & 2278c2ecf20Sopenharmony_ci (PAGE_SIZE - 1)); 2288c2ecf20Sopenharmony_ci} 2298c2ecf20Sopenharmony_ci 2308c2ecf20Sopenharmony_cistatic void mthca_wq_reset(struct mthca_wq *wq) 2318c2ecf20Sopenharmony_ci{ 2328c2ecf20Sopenharmony_ci wq->next_ind = 0; 2338c2ecf20Sopenharmony_ci wq->last_comp = wq->max - 1; 2348c2ecf20Sopenharmony_ci wq->head = 0; 2358c2ecf20Sopenharmony_ci wq->tail = 0; 2368c2ecf20Sopenharmony_ci} 2378c2ecf20Sopenharmony_ci 2388c2ecf20Sopenharmony_civoid mthca_qp_event(struct mthca_dev *dev, u32 qpn, 2398c2ecf20Sopenharmony_ci enum ib_event_type event_type) 2408c2ecf20Sopenharmony_ci{ 2418c2ecf20Sopenharmony_ci struct mthca_qp *qp; 2428c2ecf20Sopenharmony_ci struct ib_event event; 2438c2ecf20Sopenharmony_ci 2448c2ecf20Sopenharmony_ci spin_lock(&dev->qp_table.lock); 2458c2ecf20Sopenharmony_ci qp = mthca_array_get(&dev->qp_table.qp, qpn & (dev->limits.num_qps - 1)); 2468c2ecf20Sopenharmony_ci if (qp) 2478c2ecf20Sopenharmony_ci ++qp->refcount; 2488c2ecf20Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 2498c2ecf20Sopenharmony_ci 2508c2ecf20Sopenharmony_ci if (!qp) { 2518c2ecf20Sopenharmony_ci mthca_warn(dev, "Async event %d for bogus QP %08x\n", 2528c2ecf20Sopenharmony_ci event_type, qpn); 2538c2ecf20Sopenharmony_ci return; 2548c2ecf20Sopenharmony_ci } 2558c2ecf20Sopenharmony_ci 2568c2ecf20Sopenharmony_ci if (event_type == IB_EVENT_PATH_MIG) 2578c2ecf20Sopenharmony_ci qp->port = qp->alt_port; 2588c2ecf20Sopenharmony_ci 2598c2ecf20Sopenharmony_ci event.device = &dev->ib_dev; 2608c2ecf20Sopenharmony_ci event.event = event_type; 2618c2ecf20Sopenharmony_ci event.element.qp = &qp->ibqp; 2628c2ecf20Sopenharmony_ci if (qp->ibqp.event_handler) 2638c2ecf20Sopenharmony_ci qp->ibqp.event_handler(&event, qp->ibqp.qp_context); 2648c2ecf20Sopenharmony_ci 2658c2ecf20Sopenharmony_ci spin_lock(&dev->qp_table.lock); 2668c2ecf20Sopenharmony_ci if (!--qp->refcount) 2678c2ecf20Sopenharmony_ci wake_up(&qp->wait); 2688c2ecf20Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 2698c2ecf20Sopenharmony_ci} 2708c2ecf20Sopenharmony_ci 2718c2ecf20Sopenharmony_cistatic int to_mthca_state(enum ib_qp_state ib_state) 2728c2ecf20Sopenharmony_ci{ 2738c2ecf20Sopenharmony_ci switch (ib_state) { 2748c2ecf20Sopenharmony_ci case IB_QPS_RESET: return MTHCA_QP_STATE_RST; 2758c2ecf20Sopenharmony_ci case IB_QPS_INIT: return MTHCA_QP_STATE_INIT; 2768c2ecf20Sopenharmony_ci case IB_QPS_RTR: return MTHCA_QP_STATE_RTR; 2778c2ecf20Sopenharmony_ci case IB_QPS_RTS: return MTHCA_QP_STATE_RTS; 2788c2ecf20Sopenharmony_ci case IB_QPS_SQD: return MTHCA_QP_STATE_SQD; 2798c2ecf20Sopenharmony_ci case IB_QPS_SQE: return MTHCA_QP_STATE_SQE; 2808c2ecf20Sopenharmony_ci case IB_QPS_ERR: return MTHCA_QP_STATE_ERR; 2818c2ecf20Sopenharmony_ci default: return -1; 2828c2ecf20Sopenharmony_ci } 2838c2ecf20Sopenharmony_ci} 2848c2ecf20Sopenharmony_ci 2858c2ecf20Sopenharmony_cienum { RC, UC, UD, RD, RDEE, MLX, NUM_TRANS }; 2868c2ecf20Sopenharmony_ci 2878c2ecf20Sopenharmony_cistatic int to_mthca_st(int transport) 2888c2ecf20Sopenharmony_ci{ 2898c2ecf20Sopenharmony_ci switch (transport) { 2908c2ecf20Sopenharmony_ci case RC: return MTHCA_QP_ST_RC; 2918c2ecf20Sopenharmony_ci case UC: return MTHCA_QP_ST_UC; 2928c2ecf20Sopenharmony_ci case UD: return MTHCA_QP_ST_UD; 2938c2ecf20Sopenharmony_ci case RD: return MTHCA_QP_ST_RD; 2948c2ecf20Sopenharmony_ci case MLX: return MTHCA_QP_ST_MLX; 2958c2ecf20Sopenharmony_ci default: return -1; 2968c2ecf20Sopenharmony_ci } 2978c2ecf20Sopenharmony_ci} 2988c2ecf20Sopenharmony_ci 2998c2ecf20Sopenharmony_cistatic void store_attrs(struct mthca_sqp *sqp, const struct ib_qp_attr *attr, 3008c2ecf20Sopenharmony_ci int attr_mask) 3018c2ecf20Sopenharmony_ci{ 3028c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_PKEY_INDEX) 3038c2ecf20Sopenharmony_ci sqp->pkey_index = attr->pkey_index; 3048c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_QKEY) 3058c2ecf20Sopenharmony_ci sqp->qkey = attr->qkey; 3068c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_SQ_PSN) 3078c2ecf20Sopenharmony_ci sqp->send_psn = attr->sq_psn; 3088c2ecf20Sopenharmony_ci} 3098c2ecf20Sopenharmony_ci 3108c2ecf20Sopenharmony_cistatic void init_port(struct mthca_dev *dev, int port) 3118c2ecf20Sopenharmony_ci{ 3128c2ecf20Sopenharmony_ci int err; 3138c2ecf20Sopenharmony_ci struct mthca_init_ib_param param; 3148c2ecf20Sopenharmony_ci 3158c2ecf20Sopenharmony_ci memset(¶m, 0, sizeof param); 3168c2ecf20Sopenharmony_ci 3178c2ecf20Sopenharmony_ci param.port_width = dev->limits.port_width_cap; 3188c2ecf20Sopenharmony_ci param.vl_cap = dev->limits.vl_cap; 3198c2ecf20Sopenharmony_ci param.mtu_cap = dev->limits.mtu_cap; 3208c2ecf20Sopenharmony_ci param.gid_cap = dev->limits.gid_table_len; 3218c2ecf20Sopenharmony_ci param.pkey_cap = dev->limits.pkey_table_len; 3228c2ecf20Sopenharmony_ci 3238c2ecf20Sopenharmony_ci err = mthca_INIT_IB(dev, ¶m, port); 3248c2ecf20Sopenharmony_ci if (err) 3258c2ecf20Sopenharmony_ci mthca_warn(dev, "INIT_IB failed, return code %d.\n", err); 3268c2ecf20Sopenharmony_ci} 3278c2ecf20Sopenharmony_ci 3288c2ecf20Sopenharmony_cistatic __be32 get_hw_access_flags(struct mthca_qp *qp, const struct ib_qp_attr *attr, 3298c2ecf20Sopenharmony_ci int attr_mask) 3308c2ecf20Sopenharmony_ci{ 3318c2ecf20Sopenharmony_ci u8 dest_rd_atomic; 3328c2ecf20Sopenharmony_ci u32 access_flags; 3338c2ecf20Sopenharmony_ci u32 hw_access_flags = 0; 3348c2ecf20Sopenharmony_ci 3358c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) 3368c2ecf20Sopenharmony_ci dest_rd_atomic = attr->max_dest_rd_atomic; 3378c2ecf20Sopenharmony_ci else 3388c2ecf20Sopenharmony_ci dest_rd_atomic = qp->resp_depth; 3398c2ecf20Sopenharmony_ci 3408c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_ACCESS_FLAGS) 3418c2ecf20Sopenharmony_ci access_flags = attr->qp_access_flags; 3428c2ecf20Sopenharmony_ci else 3438c2ecf20Sopenharmony_ci access_flags = qp->atomic_rd_en; 3448c2ecf20Sopenharmony_ci 3458c2ecf20Sopenharmony_ci if (!dest_rd_atomic) 3468c2ecf20Sopenharmony_ci access_flags &= IB_ACCESS_REMOTE_WRITE; 3478c2ecf20Sopenharmony_ci 3488c2ecf20Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_READ) 3498c2ecf20Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RRE; 3508c2ecf20Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_ATOMIC) 3518c2ecf20Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RAE; 3528c2ecf20Sopenharmony_ci if (access_flags & IB_ACCESS_REMOTE_WRITE) 3538c2ecf20Sopenharmony_ci hw_access_flags |= MTHCA_QP_BIT_RWE; 3548c2ecf20Sopenharmony_ci 3558c2ecf20Sopenharmony_ci return cpu_to_be32(hw_access_flags); 3568c2ecf20Sopenharmony_ci} 3578c2ecf20Sopenharmony_ci 3588c2ecf20Sopenharmony_cistatic inline enum ib_qp_state to_ib_qp_state(int mthca_state) 3598c2ecf20Sopenharmony_ci{ 3608c2ecf20Sopenharmony_ci switch (mthca_state) { 3618c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_RST: return IB_QPS_RESET; 3628c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_INIT: return IB_QPS_INIT; 3638c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_RTR: return IB_QPS_RTR; 3648c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_RTS: return IB_QPS_RTS; 3658c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_DRAINING: 3668c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_SQD: return IB_QPS_SQD; 3678c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_SQE: return IB_QPS_SQE; 3688c2ecf20Sopenharmony_ci case MTHCA_QP_STATE_ERR: return IB_QPS_ERR; 3698c2ecf20Sopenharmony_ci default: return -1; 3708c2ecf20Sopenharmony_ci } 3718c2ecf20Sopenharmony_ci} 3728c2ecf20Sopenharmony_ci 3738c2ecf20Sopenharmony_cistatic inline enum ib_mig_state to_ib_mig_state(int mthca_mig_state) 3748c2ecf20Sopenharmony_ci{ 3758c2ecf20Sopenharmony_ci switch (mthca_mig_state) { 3768c2ecf20Sopenharmony_ci case 0: return IB_MIG_ARMED; 3778c2ecf20Sopenharmony_ci case 1: return IB_MIG_REARM; 3788c2ecf20Sopenharmony_ci case 3: return IB_MIG_MIGRATED; 3798c2ecf20Sopenharmony_ci default: return -1; 3808c2ecf20Sopenharmony_ci } 3818c2ecf20Sopenharmony_ci} 3828c2ecf20Sopenharmony_ci 3838c2ecf20Sopenharmony_cistatic int to_ib_qp_access_flags(int mthca_flags) 3848c2ecf20Sopenharmony_ci{ 3858c2ecf20Sopenharmony_ci int ib_flags = 0; 3868c2ecf20Sopenharmony_ci 3878c2ecf20Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RRE) 3888c2ecf20Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_READ; 3898c2ecf20Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RWE) 3908c2ecf20Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_WRITE; 3918c2ecf20Sopenharmony_ci if (mthca_flags & MTHCA_QP_BIT_RAE) 3928c2ecf20Sopenharmony_ci ib_flags |= IB_ACCESS_REMOTE_ATOMIC; 3938c2ecf20Sopenharmony_ci 3948c2ecf20Sopenharmony_ci return ib_flags; 3958c2ecf20Sopenharmony_ci} 3968c2ecf20Sopenharmony_ci 3978c2ecf20Sopenharmony_cistatic void to_rdma_ah_attr(struct mthca_dev *dev, 3988c2ecf20Sopenharmony_ci struct rdma_ah_attr *ah_attr, 3998c2ecf20Sopenharmony_ci struct mthca_qp_path *path) 4008c2ecf20Sopenharmony_ci{ 4018c2ecf20Sopenharmony_ci u8 port_num = (be32_to_cpu(path->port_pkey) >> 24) & 0x3; 4028c2ecf20Sopenharmony_ci 4038c2ecf20Sopenharmony_ci memset(ah_attr, 0, sizeof(*ah_attr)); 4048c2ecf20Sopenharmony_ci 4058c2ecf20Sopenharmony_ci if (port_num == 0 || port_num > dev->limits.num_ports) 4068c2ecf20Sopenharmony_ci return; 4078c2ecf20Sopenharmony_ci ah_attr->type = rdma_ah_find_type(&dev->ib_dev, port_num); 4088c2ecf20Sopenharmony_ci rdma_ah_set_port_num(ah_attr, port_num); 4098c2ecf20Sopenharmony_ci 4108c2ecf20Sopenharmony_ci rdma_ah_set_dlid(ah_attr, be16_to_cpu(path->rlid)); 4118c2ecf20Sopenharmony_ci rdma_ah_set_sl(ah_attr, be32_to_cpu(path->sl_tclass_flowlabel) >> 28); 4128c2ecf20Sopenharmony_ci rdma_ah_set_path_bits(ah_attr, path->g_mylmc & 0x7f); 4138c2ecf20Sopenharmony_ci rdma_ah_set_static_rate(ah_attr, 4148c2ecf20Sopenharmony_ci mthca_rate_to_ib(dev, 4158c2ecf20Sopenharmony_ci path->static_rate & 0xf, 4168c2ecf20Sopenharmony_ci port_num)); 4178c2ecf20Sopenharmony_ci if (path->g_mylmc & (1 << 7)) { 4188c2ecf20Sopenharmony_ci u32 tc_fl = be32_to_cpu(path->sl_tclass_flowlabel); 4198c2ecf20Sopenharmony_ci 4208c2ecf20Sopenharmony_ci rdma_ah_set_grh(ah_attr, NULL, 4218c2ecf20Sopenharmony_ci tc_fl & 0xfffff, 4228c2ecf20Sopenharmony_ci path->mgid_index & 4238c2ecf20Sopenharmony_ci (dev->limits.gid_table_len - 1), 4248c2ecf20Sopenharmony_ci path->hop_limit, 4258c2ecf20Sopenharmony_ci (tc_fl >> 20) & 0xff); 4268c2ecf20Sopenharmony_ci rdma_ah_set_dgid_raw(ah_attr, path->rgid); 4278c2ecf20Sopenharmony_ci } 4288c2ecf20Sopenharmony_ci} 4298c2ecf20Sopenharmony_ci 4308c2ecf20Sopenharmony_ciint mthca_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr, int qp_attr_mask, 4318c2ecf20Sopenharmony_ci struct ib_qp_init_attr *qp_init_attr) 4328c2ecf20Sopenharmony_ci{ 4338c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 4348c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 4358c2ecf20Sopenharmony_ci int err = 0; 4368c2ecf20Sopenharmony_ci struct mthca_mailbox *mailbox = NULL; 4378c2ecf20Sopenharmony_ci struct mthca_qp_param *qp_param; 4388c2ecf20Sopenharmony_ci struct mthca_qp_context *context; 4398c2ecf20Sopenharmony_ci int mthca_state; 4408c2ecf20Sopenharmony_ci 4418c2ecf20Sopenharmony_ci mutex_lock(&qp->mutex); 4428c2ecf20Sopenharmony_ci 4438c2ecf20Sopenharmony_ci if (qp->state == IB_QPS_RESET) { 4448c2ecf20Sopenharmony_ci qp_attr->qp_state = IB_QPS_RESET; 4458c2ecf20Sopenharmony_ci goto done; 4468c2ecf20Sopenharmony_ci } 4478c2ecf20Sopenharmony_ci 4488c2ecf20Sopenharmony_ci mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); 4498c2ecf20Sopenharmony_ci if (IS_ERR(mailbox)) { 4508c2ecf20Sopenharmony_ci err = PTR_ERR(mailbox); 4518c2ecf20Sopenharmony_ci goto out; 4528c2ecf20Sopenharmony_ci } 4538c2ecf20Sopenharmony_ci 4548c2ecf20Sopenharmony_ci err = mthca_QUERY_QP(dev, qp->qpn, 0, mailbox); 4558c2ecf20Sopenharmony_ci if (err) { 4568c2ecf20Sopenharmony_ci mthca_warn(dev, "QUERY_QP failed (%d)\n", err); 4578c2ecf20Sopenharmony_ci goto out_mailbox; 4588c2ecf20Sopenharmony_ci } 4598c2ecf20Sopenharmony_ci 4608c2ecf20Sopenharmony_ci qp_param = mailbox->buf; 4618c2ecf20Sopenharmony_ci context = &qp_param->context; 4628c2ecf20Sopenharmony_ci mthca_state = be32_to_cpu(context->flags) >> 28; 4638c2ecf20Sopenharmony_ci 4648c2ecf20Sopenharmony_ci qp->state = to_ib_qp_state(mthca_state); 4658c2ecf20Sopenharmony_ci qp_attr->qp_state = qp->state; 4668c2ecf20Sopenharmony_ci qp_attr->path_mtu = context->mtu_msgmax >> 5; 4678c2ecf20Sopenharmony_ci qp_attr->path_mig_state = 4688c2ecf20Sopenharmony_ci to_ib_mig_state((be32_to_cpu(context->flags) >> 11) & 0x3); 4698c2ecf20Sopenharmony_ci qp_attr->qkey = be32_to_cpu(context->qkey); 4708c2ecf20Sopenharmony_ci qp_attr->rq_psn = be32_to_cpu(context->rnr_nextrecvpsn) & 0xffffff; 4718c2ecf20Sopenharmony_ci qp_attr->sq_psn = be32_to_cpu(context->next_send_psn) & 0xffffff; 4728c2ecf20Sopenharmony_ci qp_attr->dest_qp_num = be32_to_cpu(context->remote_qpn) & 0xffffff; 4738c2ecf20Sopenharmony_ci qp_attr->qp_access_flags = 4748c2ecf20Sopenharmony_ci to_ib_qp_access_flags(be32_to_cpu(context->params2)); 4758c2ecf20Sopenharmony_ci 4768c2ecf20Sopenharmony_ci if (qp->transport == RC || qp->transport == UC) { 4778c2ecf20Sopenharmony_ci to_rdma_ah_attr(dev, &qp_attr->ah_attr, &context->pri_path); 4788c2ecf20Sopenharmony_ci to_rdma_ah_attr(dev, &qp_attr->alt_ah_attr, &context->alt_path); 4798c2ecf20Sopenharmony_ci qp_attr->alt_pkey_index = 4808c2ecf20Sopenharmony_ci be32_to_cpu(context->alt_path.port_pkey) & 0x7f; 4818c2ecf20Sopenharmony_ci qp_attr->alt_port_num = 4828c2ecf20Sopenharmony_ci rdma_ah_get_port_num(&qp_attr->alt_ah_attr); 4838c2ecf20Sopenharmony_ci } 4848c2ecf20Sopenharmony_ci 4858c2ecf20Sopenharmony_ci qp_attr->pkey_index = be32_to_cpu(context->pri_path.port_pkey) & 0x7f; 4868c2ecf20Sopenharmony_ci qp_attr->port_num = 4878c2ecf20Sopenharmony_ci (be32_to_cpu(context->pri_path.port_pkey) >> 24) & 0x3; 4888c2ecf20Sopenharmony_ci 4898c2ecf20Sopenharmony_ci /* qp_attr->en_sqd_async_notify is only applicable in modify qp */ 4908c2ecf20Sopenharmony_ci qp_attr->sq_draining = mthca_state == MTHCA_QP_STATE_DRAINING; 4918c2ecf20Sopenharmony_ci 4928c2ecf20Sopenharmony_ci qp_attr->max_rd_atomic = 1 << ((be32_to_cpu(context->params1) >> 21) & 0x7); 4938c2ecf20Sopenharmony_ci 4948c2ecf20Sopenharmony_ci qp_attr->max_dest_rd_atomic = 4958c2ecf20Sopenharmony_ci 1 << ((be32_to_cpu(context->params2) >> 21) & 0x7); 4968c2ecf20Sopenharmony_ci qp_attr->min_rnr_timer = 4978c2ecf20Sopenharmony_ci (be32_to_cpu(context->rnr_nextrecvpsn) >> 24) & 0x1f; 4988c2ecf20Sopenharmony_ci qp_attr->timeout = context->pri_path.ackto >> 3; 4998c2ecf20Sopenharmony_ci qp_attr->retry_cnt = (be32_to_cpu(context->params1) >> 16) & 0x7; 5008c2ecf20Sopenharmony_ci qp_attr->rnr_retry = context->pri_path.rnr_retry >> 5; 5018c2ecf20Sopenharmony_ci qp_attr->alt_timeout = context->alt_path.ackto >> 3; 5028c2ecf20Sopenharmony_ci 5038c2ecf20Sopenharmony_cidone: 5048c2ecf20Sopenharmony_ci qp_attr->cur_qp_state = qp_attr->qp_state; 5058c2ecf20Sopenharmony_ci qp_attr->cap.max_send_wr = qp->sq.max; 5068c2ecf20Sopenharmony_ci qp_attr->cap.max_recv_wr = qp->rq.max; 5078c2ecf20Sopenharmony_ci qp_attr->cap.max_send_sge = qp->sq.max_gs; 5088c2ecf20Sopenharmony_ci qp_attr->cap.max_recv_sge = qp->rq.max_gs; 5098c2ecf20Sopenharmony_ci qp_attr->cap.max_inline_data = qp->max_inline_data; 5108c2ecf20Sopenharmony_ci 5118c2ecf20Sopenharmony_ci qp_init_attr->cap = qp_attr->cap; 5128c2ecf20Sopenharmony_ci qp_init_attr->sq_sig_type = qp->sq_policy; 5138c2ecf20Sopenharmony_ci 5148c2ecf20Sopenharmony_ciout_mailbox: 5158c2ecf20Sopenharmony_ci mthca_free_mailbox(dev, mailbox); 5168c2ecf20Sopenharmony_ci 5178c2ecf20Sopenharmony_ciout: 5188c2ecf20Sopenharmony_ci mutex_unlock(&qp->mutex); 5198c2ecf20Sopenharmony_ci return err; 5208c2ecf20Sopenharmony_ci} 5218c2ecf20Sopenharmony_ci 5228c2ecf20Sopenharmony_cistatic int mthca_path_set(struct mthca_dev *dev, const struct rdma_ah_attr *ah, 5238c2ecf20Sopenharmony_ci struct mthca_qp_path *path, u8 port) 5248c2ecf20Sopenharmony_ci{ 5258c2ecf20Sopenharmony_ci path->g_mylmc = rdma_ah_get_path_bits(ah) & 0x7f; 5268c2ecf20Sopenharmony_ci path->rlid = cpu_to_be16(rdma_ah_get_dlid(ah)); 5278c2ecf20Sopenharmony_ci path->static_rate = mthca_get_rate(dev, rdma_ah_get_static_rate(ah), 5288c2ecf20Sopenharmony_ci port); 5298c2ecf20Sopenharmony_ci 5308c2ecf20Sopenharmony_ci if (rdma_ah_get_ah_flags(ah) & IB_AH_GRH) { 5318c2ecf20Sopenharmony_ci const struct ib_global_route *grh = rdma_ah_read_grh(ah); 5328c2ecf20Sopenharmony_ci 5338c2ecf20Sopenharmony_ci if (grh->sgid_index >= dev->limits.gid_table_len) { 5348c2ecf20Sopenharmony_ci mthca_dbg(dev, "sgid_index (%u) too large. max is %d\n", 5358c2ecf20Sopenharmony_ci grh->sgid_index, 5368c2ecf20Sopenharmony_ci dev->limits.gid_table_len - 1); 5378c2ecf20Sopenharmony_ci return -1; 5388c2ecf20Sopenharmony_ci } 5398c2ecf20Sopenharmony_ci 5408c2ecf20Sopenharmony_ci path->g_mylmc |= 1 << 7; 5418c2ecf20Sopenharmony_ci path->mgid_index = grh->sgid_index; 5428c2ecf20Sopenharmony_ci path->hop_limit = grh->hop_limit; 5438c2ecf20Sopenharmony_ci path->sl_tclass_flowlabel = 5448c2ecf20Sopenharmony_ci cpu_to_be32((rdma_ah_get_sl(ah) << 28) | 5458c2ecf20Sopenharmony_ci (grh->traffic_class << 20) | 5468c2ecf20Sopenharmony_ci (grh->flow_label)); 5478c2ecf20Sopenharmony_ci memcpy(path->rgid, grh->dgid.raw, 16); 5488c2ecf20Sopenharmony_ci } else { 5498c2ecf20Sopenharmony_ci path->sl_tclass_flowlabel = cpu_to_be32(rdma_ah_get_sl(ah) << 5508c2ecf20Sopenharmony_ci 28); 5518c2ecf20Sopenharmony_ci } 5528c2ecf20Sopenharmony_ci 5538c2ecf20Sopenharmony_ci return 0; 5548c2ecf20Sopenharmony_ci} 5558c2ecf20Sopenharmony_ci 5568c2ecf20Sopenharmony_cistatic int __mthca_modify_qp(struct ib_qp *ibqp, 5578c2ecf20Sopenharmony_ci const struct ib_qp_attr *attr, int attr_mask, 5588c2ecf20Sopenharmony_ci enum ib_qp_state cur_state, 5598c2ecf20Sopenharmony_ci enum ib_qp_state new_state, 5608c2ecf20Sopenharmony_ci struct ib_udata *udata) 5618c2ecf20Sopenharmony_ci{ 5628c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 5638c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 5648c2ecf20Sopenharmony_ci struct mthca_ucontext *context = rdma_udata_to_drv_context( 5658c2ecf20Sopenharmony_ci udata, struct mthca_ucontext, ibucontext); 5668c2ecf20Sopenharmony_ci struct mthca_mailbox *mailbox; 5678c2ecf20Sopenharmony_ci struct mthca_qp_param *qp_param; 5688c2ecf20Sopenharmony_ci struct mthca_qp_context *qp_context; 5698c2ecf20Sopenharmony_ci u32 sqd_event = 0; 5708c2ecf20Sopenharmony_ci int err = -EINVAL; 5718c2ecf20Sopenharmony_ci 5728c2ecf20Sopenharmony_ci mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); 5738c2ecf20Sopenharmony_ci if (IS_ERR(mailbox)) { 5748c2ecf20Sopenharmony_ci err = PTR_ERR(mailbox); 5758c2ecf20Sopenharmony_ci goto out; 5768c2ecf20Sopenharmony_ci } 5778c2ecf20Sopenharmony_ci qp_param = mailbox->buf; 5788c2ecf20Sopenharmony_ci qp_context = &qp_param->context; 5798c2ecf20Sopenharmony_ci memset(qp_param, 0, sizeof *qp_param); 5808c2ecf20Sopenharmony_ci 5818c2ecf20Sopenharmony_ci qp_context->flags = cpu_to_be32((to_mthca_state(new_state) << 28) | 5828c2ecf20Sopenharmony_ci (to_mthca_st(qp->transport) << 16)); 5838c2ecf20Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_BIT_DE); 5848c2ecf20Sopenharmony_ci if (!(attr_mask & IB_QP_PATH_MIG_STATE)) 5858c2ecf20Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_MIGRATED << 11); 5868c2ecf20Sopenharmony_ci else { 5878c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PM_STATE); 5888c2ecf20Sopenharmony_ci switch (attr->path_mig_state) { 5898c2ecf20Sopenharmony_ci case IB_MIG_MIGRATED: 5908c2ecf20Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_MIGRATED << 11); 5918c2ecf20Sopenharmony_ci break; 5928c2ecf20Sopenharmony_ci case IB_MIG_REARM: 5938c2ecf20Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_REARM << 11); 5948c2ecf20Sopenharmony_ci break; 5958c2ecf20Sopenharmony_ci case IB_MIG_ARMED: 5968c2ecf20Sopenharmony_ci qp_context->flags |= cpu_to_be32(MTHCA_QP_PM_ARMED << 11); 5978c2ecf20Sopenharmony_ci break; 5988c2ecf20Sopenharmony_ci } 5998c2ecf20Sopenharmony_ci } 6008c2ecf20Sopenharmony_ci 6018c2ecf20Sopenharmony_ci /* leave tavor_sched_queue as 0 */ 6028c2ecf20Sopenharmony_ci 6038c2ecf20Sopenharmony_ci if (qp->transport == MLX || qp->transport == UD) 6048c2ecf20Sopenharmony_ci qp_context->mtu_msgmax = (IB_MTU_2048 << 5) | 11; 6058c2ecf20Sopenharmony_ci else if (attr_mask & IB_QP_PATH_MTU) { 6068c2ecf20Sopenharmony_ci if (attr->path_mtu < IB_MTU_256 || attr->path_mtu > IB_MTU_2048) { 6078c2ecf20Sopenharmony_ci mthca_dbg(dev, "path MTU (%u) is invalid\n", 6088c2ecf20Sopenharmony_ci attr->path_mtu); 6098c2ecf20Sopenharmony_ci goto out_mailbox; 6108c2ecf20Sopenharmony_ci } 6118c2ecf20Sopenharmony_ci qp_context->mtu_msgmax = (attr->path_mtu << 5) | 31; 6128c2ecf20Sopenharmony_ci } 6138c2ecf20Sopenharmony_ci 6148c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 6158c2ecf20Sopenharmony_ci if (qp->rq.max) 6168c2ecf20Sopenharmony_ci qp_context->rq_size_stride = ilog2(qp->rq.max) << 3; 6178c2ecf20Sopenharmony_ci qp_context->rq_size_stride |= qp->rq.wqe_shift - 4; 6188c2ecf20Sopenharmony_ci 6198c2ecf20Sopenharmony_ci if (qp->sq.max) 6208c2ecf20Sopenharmony_ci qp_context->sq_size_stride = ilog2(qp->sq.max) << 3; 6218c2ecf20Sopenharmony_ci qp_context->sq_size_stride |= qp->sq.wqe_shift - 4; 6228c2ecf20Sopenharmony_ci } 6238c2ecf20Sopenharmony_ci 6248c2ecf20Sopenharmony_ci /* leave arbel_sched_queue as 0 */ 6258c2ecf20Sopenharmony_ci 6268c2ecf20Sopenharmony_ci if (qp->ibqp.uobject) 6278c2ecf20Sopenharmony_ci qp_context->usr_page = cpu_to_be32(context->uar.index); 6288c2ecf20Sopenharmony_ci else 6298c2ecf20Sopenharmony_ci qp_context->usr_page = cpu_to_be32(dev->driver_uar.index); 6308c2ecf20Sopenharmony_ci qp_context->local_qpn = cpu_to_be32(qp->qpn); 6318c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_DEST_QPN) { 6328c2ecf20Sopenharmony_ci qp_context->remote_qpn = cpu_to_be32(attr->dest_qp_num); 6338c2ecf20Sopenharmony_ci } 6348c2ecf20Sopenharmony_ci 6358c2ecf20Sopenharmony_ci if (qp->transport == MLX) 6368c2ecf20Sopenharmony_ci qp_context->pri_path.port_pkey |= 6378c2ecf20Sopenharmony_ci cpu_to_be32(qp->port << 24); 6388c2ecf20Sopenharmony_ci else { 6398c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_PORT) { 6408c2ecf20Sopenharmony_ci qp_context->pri_path.port_pkey |= 6418c2ecf20Sopenharmony_ci cpu_to_be32(attr->port_num << 24); 6428c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PORT_NUM); 6438c2ecf20Sopenharmony_ci } 6448c2ecf20Sopenharmony_ci } 6458c2ecf20Sopenharmony_ci 6468c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_PKEY_INDEX) { 6478c2ecf20Sopenharmony_ci qp_context->pri_path.port_pkey |= 6488c2ecf20Sopenharmony_ci cpu_to_be32(attr->pkey_index); 6498c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PKEY_INDEX); 6508c2ecf20Sopenharmony_ci } 6518c2ecf20Sopenharmony_ci 6528c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_RNR_RETRY) { 6538c2ecf20Sopenharmony_ci qp_context->alt_path.rnr_retry = qp_context->pri_path.rnr_retry = 6548c2ecf20Sopenharmony_ci attr->rnr_retry << 5; 6558c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RNR_RETRY | 6568c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_ALT_RNR_RETRY); 6578c2ecf20Sopenharmony_ci } 6588c2ecf20Sopenharmony_ci 6598c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_AV) { 6608c2ecf20Sopenharmony_ci if (mthca_path_set(dev, &attr->ah_attr, &qp_context->pri_path, 6618c2ecf20Sopenharmony_ci attr_mask & IB_QP_PORT ? attr->port_num : qp->port)) 6628c2ecf20Sopenharmony_ci goto out_mailbox; 6638c2ecf20Sopenharmony_ci 6648c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_PRIMARY_ADDR_PATH); 6658c2ecf20Sopenharmony_ci } 6668c2ecf20Sopenharmony_ci 6678c2ecf20Sopenharmony_ci if (ibqp->qp_type == IB_QPT_RC && 6688c2ecf20Sopenharmony_ci cur_state == IB_QPS_INIT && new_state == IB_QPS_RTR) { 6698c2ecf20Sopenharmony_ci u8 sched_queue = ibqp->uobject ? 0x2 : 0x1; 6708c2ecf20Sopenharmony_ci 6718c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) 6728c2ecf20Sopenharmony_ci qp_context->rlkey_arbel_sched_queue |= sched_queue; 6738c2ecf20Sopenharmony_ci else 6748c2ecf20Sopenharmony_ci qp_context->tavor_sched_queue |= cpu_to_be32(sched_queue); 6758c2ecf20Sopenharmony_ci 6768c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= 6778c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_QP_OPTPAR_SCHED_QUEUE); 6788c2ecf20Sopenharmony_ci } 6798c2ecf20Sopenharmony_ci 6808c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_TIMEOUT) { 6818c2ecf20Sopenharmony_ci qp_context->pri_path.ackto = attr->timeout << 3; 6828c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_ACK_TIMEOUT); 6838c2ecf20Sopenharmony_ci } 6848c2ecf20Sopenharmony_ci 6858c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_ALT_PATH) { 6868c2ecf20Sopenharmony_ci if (attr->alt_pkey_index >= dev->limits.pkey_table_len) { 6878c2ecf20Sopenharmony_ci mthca_dbg(dev, "Alternate P_Key index (%u) too large. max is %d\n", 6888c2ecf20Sopenharmony_ci attr->alt_pkey_index, dev->limits.pkey_table_len-1); 6898c2ecf20Sopenharmony_ci goto out_mailbox; 6908c2ecf20Sopenharmony_ci } 6918c2ecf20Sopenharmony_ci 6928c2ecf20Sopenharmony_ci if (attr->alt_port_num == 0 || attr->alt_port_num > dev->limits.num_ports) { 6938c2ecf20Sopenharmony_ci mthca_dbg(dev, "Alternate port number (%u) is invalid\n", 6948c2ecf20Sopenharmony_ci attr->alt_port_num); 6958c2ecf20Sopenharmony_ci goto out_mailbox; 6968c2ecf20Sopenharmony_ci } 6978c2ecf20Sopenharmony_ci 6988c2ecf20Sopenharmony_ci if (mthca_path_set(dev, &attr->alt_ah_attr, &qp_context->alt_path, 6998c2ecf20Sopenharmony_ci rdma_ah_get_port_num(&attr->alt_ah_attr))) 7008c2ecf20Sopenharmony_ci goto out_mailbox; 7018c2ecf20Sopenharmony_ci 7028c2ecf20Sopenharmony_ci qp_context->alt_path.port_pkey |= cpu_to_be32(attr->alt_pkey_index | 7038c2ecf20Sopenharmony_ci attr->alt_port_num << 24); 7048c2ecf20Sopenharmony_ci qp_context->alt_path.ackto = attr->alt_timeout << 3; 7058c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_ALT_ADDR_PATH); 7068c2ecf20Sopenharmony_ci } 7078c2ecf20Sopenharmony_ci 7088c2ecf20Sopenharmony_ci /* leave rdd as 0 */ 7098c2ecf20Sopenharmony_ci qp_context->pd = cpu_to_be32(to_mpd(ibqp->pd)->pd_num); 7108c2ecf20Sopenharmony_ci /* leave wqe_base as 0 (we always create an MR based at 0 for WQs) */ 7118c2ecf20Sopenharmony_ci qp_context->wqe_lkey = cpu_to_be32(qp->mr.ibmr.lkey); 7128c2ecf20Sopenharmony_ci qp_context->params1 = cpu_to_be32((MTHCA_ACK_REQ_FREQ << 28) | 7138c2ecf20Sopenharmony_ci (MTHCA_FLIGHT_LIMIT << 24) | 7148c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SWE); 7158c2ecf20Sopenharmony_ci if (qp->sq_policy == IB_SIGNAL_ALL_WR) 7168c2ecf20Sopenharmony_ci qp_context->params1 |= cpu_to_be32(MTHCA_QP_BIT_SSC); 7178c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_RETRY_CNT) { 7188c2ecf20Sopenharmony_ci qp_context->params1 |= cpu_to_be32(attr->retry_cnt << 16); 7198c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RETRY_COUNT); 7208c2ecf20Sopenharmony_ci } 7218c2ecf20Sopenharmony_ci 7228c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC) { 7238c2ecf20Sopenharmony_ci if (attr->max_rd_atomic) { 7248c2ecf20Sopenharmony_ci qp_context->params1 |= 7258c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_QP_BIT_SRE | 7268c2ecf20Sopenharmony_ci MTHCA_QP_BIT_SAE); 7278c2ecf20Sopenharmony_ci qp_context->params1 |= 7288c2ecf20Sopenharmony_ci cpu_to_be32(fls(attr->max_rd_atomic - 1) << 21); 7298c2ecf20Sopenharmony_ci } 7308c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_SRA_MAX); 7318c2ecf20Sopenharmony_ci } 7328c2ecf20Sopenharmony_ci 7338c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_SQ_PSN) 7348c2ecf20Sopenharmony_ci qp_context->next_send_psn = cpu_to_be32(attr->sq_psn); 7358c2ecf20Sopenharmony_ci qp_context->cqn_snd = cpu_to_be32(to_mcq(ibqp->send_cq)->cqn); 7368c2ecf20Sopenharmony_ci 7378c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 7388c2ecf20Sopenharmony_ci qp_context->snd_wqe_base_l = cpu_to_be32(qp->send_wqe_offset); 7398c2ecf20Sopenharmony_ci qp_context->snd_db_index = cpu_to_be32(qp->sq.db_index); 7408c2ecf20Sopenharmony_ci } 7418c2ecf20Sopenharmony_ci 7428c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) { 7438c2ecf20Sopenharmony_ci if (attr->max_dest_rd_atomic) 7448c2ecf20Sopenharmony_ci qp_context->params2 |= 7458c2ecf20Sopenharmony_ci cpu_to_be32(fls(attr->max_dest_rd_atomic - 1) << 21); 7468c2ecf20Sopenharmony_ci 7478c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RRA_MAX); 7488c2ecf20Sopenharmony_ci } 7498c2ecf20Sopenharmony_ci 7508c2ecf20Sopenharmony_ci if (attr_mask & (IB_QP_ACCESS_FLAGS | IB_QP_MAX_DEST_RD_ATOMIC)) { 7518c2ecf20Sopenharmony_ci qp_context->params2 |= get_hw_access_flags(qp, attr, attr_mask); 7528c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RWE | 7538c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RRE | 7548c2ecf20Sopenharmony_ci MTHCA_QP_OPTPAR_RAE); 7558c2ecf20Sopenharmony_ci } 7568c2ecf20Sopenharmony_ci 7578c2ecf20Sopenharmony_ci qp_context->params2 |= cpu_to_be32(MTHCA_QP_BIT_RSC); 7588c2ecf20Sopenharmony_ci 7598c2ecf20Sopenharmony_ci if (ibqp->srq) 7608c2ecf20Sopenharmony_ci qp_context->params2 |= cpu_to_be32(MTHCA_QP_BIT_RIC); 7618c2ecf20Sopenharmony_ci 7628c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MIN_RNR_TIMER) { 7638c2ecf20Sopenharmony_ci qp_context->rnr_nextrecvpsn |= cpu_to_be32(attr->min_rnr_timer << 24); 7648c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_RNR_TIMEOUT); 7658c2ecf20Sopenharmony_ci } 7668c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_RQ_PSN) 7678c2ecf20Sopenharmony_ci qp_context->rnr_nextrecvpsn |= cpu_to_be32(attr->rq_psn); 7688c2ecf20Sopenharmony_ci 7698c2ecf20Sopenharmony_ci qp_context->ra_buff_indx = 7708c2ecf20Sopenharmony_ci cpu_to_be32(dev->qp_table.rdb_base + 7718c2ecf20Sopenharmony_ci ((qp->qpn & (dev->limits.num_qps - 1)) * MTHCA_RDB_ENTRY_SIZE << 7728c2ecf20Sopenharmony_ci dev->qp_table.rdb_shift)); 7738c2ecf20Sopenharmony_ci 7748c2ecf20Sopenharmony_ci qp_context->cqn_rcv = cpu_to_be32(to_mcq(ibqp->recv_cq)->cqn); 7758c2ecf20Sopenharmony_ci 7768c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) 7778c2ecf20Sopenharmony_ci qp_context->rcv_db_index = cpu_to_be32(qp->rq.db_index); 7788c2ecf20Sopenharmony_ci 7798c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_QKEY) { 7808c2ecf20Sopenharmony_ci qp_context->qkey = cpu_to_be32(attr->qkey); 7818c2ecf20Sopenharmony_ci qp_param->opt_param_mask |= cpu_to_be32(MTHCA_QP_OPTPAR_Q_KEY); 7828c2ecf20Sopenharmony_ci } 7838c2ecf20Sopenharmony_ci 7848c2ecf20Sopenharmony_ci if (ibqp->srq) 7858c2ecf20Sopenharmony_ci qp_context->srqn = cpu_to_be32(1 << 24 | 7868c2ecf20Sopenharmony_ci to_msrq(ibqp->srq)->srqn); 7878c2ecf20Sopenharmony_ci 7888c2ecf20Sopenharmony_ci if (cur_state == IB_QPS_RTS && new_state == IB_QPS_SQD && 7898c2ecf20Sopenharmony_ci attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY && 7908c2ecf20Sopenharmony_ci attr->en_sqd_async_notify) 7918c2ecf20Sopenharmony_ci sqd_event = 1 << 31; 7928c2ecf20Sopenharmony_ci 7938c2ecf20Sopenharmony_ci err = mthca_MODIFY_QP(dev, cur_state, new_state, qp->qpn, 0, 7948c2ecf20Sopenharmony_ci mailbox, sqd_event); 7958c2ecf20Sopenharmony_ci if (err) { 7968c2ecf20Sopenharmony_ci mthca_warn(dev, "modify QP %d->%d returned %d.\n", 7978c2ecf20Sopenharmony_ci cur_state, new_state, err); 7988c2ecf20Sopenharmony_ci goto out_mailbox; 7998c2ecf20Sopenharmony_ci } 8008c2ecf20Sopenharmony_ci 8018c2ecf20Sopenharmony_ci qp->state = new_state; 8028c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_ACCESS_FLAGS) 8038c2ecf20Sopenharmony_ci qp->atomic_rd_en = attr->qp_access_flags; 8048c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) 8058c2ecf20Sopenharmony_ci qp->resp_depth = attr->max_dest_rd_atomic; 8068c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_PORT) 8078c2ecf20Sopenharmony_ci qp->port = attr->port_num; 8088c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_ALT_PATH) 8098c2ecf20Sopenharmony_ci qp->alt_port = attr->alt_port_num; 8108c2ecf20Sopenharmony_ci 8118c2ecf20Sopenharmony_ci if (is_sqp(dev, qp)) 8128c2ecf20Sopenharmony_ci store_attrs(qp->sqp, attr, attr_mask); 8138c2ecf20Sopenharmony_ci 8148c2ecf20Sopenharmony_ci /* 8158c2ecf20Sopenharmony_ci * If we moved QP0 to RTR, bring the IB link up; if we moved 8168c2ecf20Sopenharmony_ci * QP0 to RESET or ERROR, bring the link back down. 8178c2ecf20Sopenharmony_ci */ 8188c2ecf20Sopenharmony_ci if (is_qp0(dev, qp)) { 8198c2ecf20Sopenharmony_ci if (cur_state != IB_QPS_RTR && 8208c2ecf20Sopenharmony_ci new_state == IB_QPS_RTR) 8218c2ecf20Sopenharmony_ci init_port(dev, qp->port); 8228c2ecf20Sopenharmony_ci 8238c2ecf20Sopenharmony_ci if (cur_state != IB_QPS_RESET && 8248c2ecf20Sopenharmony_ci cur_state != IB_QPS_ERR && 8258c2ecf20Sopenharmony_ci (new_state == IB_QPS_RESET || 8268c2ecf20Sopenharmony_ci new_state == IB_QPS_ERR)) 8278c2ecf20Sopenharmony_ci mthca_CLOSE_IB(dev, qp->port); 8288c2ecf20Sopenharmony_ci } 8298c2ecf20Sopenharmony_ci 8308c2ecf20Sopenharmony_ci /* 8318c2ecf20Sopenharmony_ci * If we moved a kernel QP to RESET, clean up all old CQ 8328c2ecf20Sopenharmony_ci * entries and reinitialize the QP. 8338c2ecf20Sopenharmony_ci */ 8348c2ecf20Sopenharmony_ci if (new_state == IB_QPS_RESET && !qp->ibqp.uobject) { 8358c2ecf20Sopenharmony_ci mthca_cq_clean(dev, to_mcq(qp->ibqp.recv_cq), qp->qpn, 8368c2ecf20Sopenharmony_ci qp->ibqp.srq ? to_msrq(qp->ibqp.srq) : NULL); 8378c2ecf20Sopenharmony_ci if (qp->ibqp.send_cq != qp->ibqp.recv_cq) 8388c2ecf20Sopenharmony_ci mthca_cq_clean(dev, to_mcq(qp->ibqp.send_cq), qp->qpn, NULL); 8398c2ecf20Sopenharmony_ci 8408c2ecf20Sopenharmony_ci mthca_wq_reset(&qp->sq); 8418c2ecf20Sopenharmony_ci qp->sq.last = get_send_wqe(qp, qp->sq.max - 1); 8428c2ecf20Sopenharmony_ci 8438c2ecf20Sopenharmony_ci mthca_wq_reset(&qp->rq); 8448c2ecf20Sopenharmony_ci qp->rq.last = get_recv_wqe(qp, qp->rq.max - 1); 8458c2ecf20Sopenharmony_ci 8468c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 8478c2ecf20Sopenharmony_ci *qp->sq.db = 0; 8488c2ecf20Sopenharmony_ci *qp->rq.db = 0; 8498c2ecf20Sopenharmony_ci } 8508c2ecf20Sopenharmony_ci } 8518c2ecf20Sopenharmony_ci 8528c2ecf20Sopenharmony_ciout_mailbox: 8538c2ecf20Sopenharmony_ci mthca_free_mailbox(dev, mailbox); 8548c2ecf20Sopenharmony_ciout: 8558c2ecf20Sopenharmony_ci return err; 8568c2ecf20Sopenharmony_ci} 8578c2ecf20Sopenharmony_ci 8588c2ecf20Sopenharmony_ciint mthca_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr, int attr_mask, 8598c2ecf20Sopenharmony_ci struct ib_udata *udata) 8608c2ecf20Sopenharmony_ci{ 8618c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 8628c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 8638c2ecf20Sopenharmony_ci enum ib_qp_state cur_state, new_state; 8648c2ecf20Sopenharmony_ci int err = -EINVAL; 8658c2ecf20Sopenharmony_ci 8668c2ecf20Sopenharmony_ci mutex_lock(&qp->mutex); 8678c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_CUR_STATE) { 8688c2ecf20Sopenharmony_ci cur_state = attr->cur_qp_state; 8698c2ecf20Sopenharmony_ci } else { 8708c2ecf20Sopenharmony_ci spin_lock_irq(&qp->sq.lock); 8718c2ecf20Sopenharmony_ci spin_lock(&qp->rq.lock); 8728c2ecf20Sopenharmony_ci cur_state = qp->state; 8738c2ecf20Sopenharmony_ci spin_unlock(&qp->rq.lock); 8748c2ecf20Sopenharmony_ci spin_unlock_irq(&qp->sq.lock); 8758c2ecf20Sopenharmony_ci } 8768c2ecf20Sopenharmony_ci 8778c2ecf20Sopenharmony_ci new_state = attr_mask & IB_QP_STATE ? attr->qp_state : cur_state; 8788c2ecf20Sopenharmony_ci 8798c2ecf20Sopenharmony_ci if (!ib_modify_qp_is_ok(cur_state, new_state, ibqp->qp_type, 8808c2ecf20Sopenharmony_ci attr_mask)) { 8818c2ecf20Sopenharmony_ci mthca_dbg(dev, "Bad QP transition (transport %d) " 8828c2ecf20Sopenharmony_ci "%d->%d with attr 0x%08x\n", 8838c2ecf20Sopenharmony_ci qp->transport, cur_state, new_state, 8848c2ecf20Sopenharmony_ci attr_mask); 8858c2ecf20Sopenharmony_ci goto out; 8868c2ecf20Sopenharmony_ci } 8878c2ecf20Sopenharmony_ci 8888c2ecf20Sopenharmony_ci if ((attr_mask & IB_QP_PKEY_INDEX) && 8898c2ecf20Sopenharmony_ci attr->pkey_index >= dev->limits.pkey_table_len) { 8908c2ecf20Sopenharmony_ci mthca_dbg(dev, "P_Key index (%u) too large. max is %d\n", 8918c2ecf20Sopenharmony_ci attr->pkey_index, dev->limits.pkey_table_len-1); 8928c2ecf20Sopenharmony_ci goto out; 8938c2ecf20Sopenharmony_ci } 8948c2ecf20Sopenharmony_ci 8958c2ecf20Sopenharmony_ci if ((attr_mask & IB_QP_PORT) && 8968c2ecf20Sopenharmony_ci (attr->port_num == 0 || attr->port_num > dev->limits.num_ports)) { 8978c2ecf20Sopenharmony_ci mthca_dbg(dev, "Port number (%u) is invalid\n", attr->port_num); 8988c2ecf20Sopenharmony_ci goto out; 8998c2ecf20Sopenharmony_ci } 9008c2ecf20Sopenharmony_ci 9018c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC && 9028c2ecf20Sopenharmony_ci attr->max_rd_atomic > dev->limits.max_qp_init_rdma) { 9038c2ecf20Sopenharmony_ci mthca_dbg(dev, "Max rdma_atomic as initiator %u too large (max is %d)\n", 9048c2ecf20Sopenharmony_ci attr->max_rd_atomic, dev->limits.max_qp_init_rdma); 9058c2ecf20Sopenharmony_ci goto out; 9068c2ecf20Sopenharmony_ci } 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC && 9098c2ecf20Sopenharmony_ci attr->max_dest_rd_atomic > 1 << dev->qp_table.rdb_shift) { 9108c2ecf20Sopenharmony_ci mthca_dbg(dev, "Max rdma_atomic as responder %u too large (max %d)\n", 9118c2ecf20Sopenharmony_ci attr->max_dest_rd_atomic, 1 << dev->qp_table.rdb_shift); 9128c2ecf20Sopenharmony_ci goto out; 9138c2ecf20Sopenharmony_ci } 9148c2ecf20Sopenharmony_ci 9158c2ecf20Sopenharmony_ci if (cur_state == new_state && cur_state == IB_QPS_RESET) { 9168c2ecf20Sopenharmony_ci err = 0; 9178c2ecf20Sopenharmony_ci goto out; 9188c2ecf20Sopenharmony_ci } 9198c2ecf20Sopenharmony_ci 9208c2ecf20Sopenharmony_ci err = __mthca_modify_qp(ibqp, attr, attr_mask, cur_state, new_state, 9218c2ecf20Sopenharmony_ci udata); 9228c2ecf20Sopenharmony_ci 9238c2ecf20Sopenharmony_ciout: 9248c2ecf20Sopenharmony_ci mutex_unlock(&qp->mutex); 9258c2ecf20Sopenharmony_ci return err; 9268c2ecf20Sopenharmony_ci} 9278c2ecf20Sopenharmony_ci 9288c2ecf20Sopenharmony_cistatic int mthca_max_data_size(struct mthca_dev *dev, struct mthca_qp *qp, int desc_sz) 9298c2ecf20Sopenharmony_ci{ 9308c2ecf20Sopenharmony_ci /* 9318c2ecf20Sopenharmony_ci * Calculate the maximum size of WQE s/g segments, excluding 9328c2ecf20Sopenharmony_ci * the next segment and other non-data segments. 9338c2ecf20Sopenharmony_ci */ 9348c2ecf20Sopenharmony_ci int max_data_size = desc_sz - sizeof (struct mthca_next_seg); 9358c2ecf20Sopenharmony_ci 9368c2ecf20Sopenharmony_ci switch (qp->transport) { 9378c2ecf20Sopenharmony_ci case MLX: 9388c2ecf20Sopenharmony_ci max_data_size -= 2 * sizeof (struct mthca_data_seg); 9398c2ecf20Sopenharmony_ci break; 9408c2ecf20Sopenharmony_ci 9418c2ecf20Sopenharmony_ci case UD: 9428c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) 9438c2ecf20Sopenharmony_ci max_data_size -= sizeof (struct mthca_arbel_ud_seg); 9448c2ecf20Sopenharmony_ci else 9458c2ecf20Sopenharmony_ci max_data_size -= sizeof (struct mthca_tavor_ud_seg); 9468c2ecf20Sopenharmony_ci break; 9478c2ecf20Sopenharmony_ci 9488c2ecf20Sopenharmony_ci default: 9498c2ecf20Sopenharmony_ci max_data_size -= sizeof (struct mthca_raddr_seg); 9508c2ecf20Sopenharmony_ci break; 9518c2ecf20Sopenharmony_ci } 9528c2ecf20Sopenharmony_ci 9538c2ecf20Sopenharmony_ci return max_data_size; 9548c2ecf20Sopenharmony_ci} 9558c2ecf20Sopenharmony_ci 9568c2ecf20Sopenharmony_cistatic inline int mthca_max_inline_data(struct mthca_pd *pd, int max_data_size) 9578c2ecf20Sopenharmony_ci{ 9588c2ecf20Sopenharmony_ci /* We don't support inline data for kernel QPs (yet). */ 9598c2ecf20Sopenharmony_ci return pd->ibpd.uobject ? max_data_size - MTHCA_INLINE_HEADER_SIZE : 0; 9608c2ecf20Sopenharmony_ci} 9618c2ecf20Sopenharmony_ci 9628c2ecf20Sopenharmony_cistatic void mthca_adjust_qp_caps(struct mthca_dev *dev, 9638c2ecf20Sopenharmony_ci struct mthca_pd *pd, 9648c2ecf20Sopenharmony_ci struct mthca_qp *qp) 9658c2ecf20Sopenharmony_ci{ 9668c2ecf20Sopenharmony_ci int max_data_size = mthca_max_data_size(dev, qp, 9678c2ecf20Sopenharmony_ci min(dev->limits.max_desc_sz, 9688c2ecf20Sopenharmony_ci 1 << qp->sq.wqe_shift)); 9698c2ecf20Sopenharmony_ci 9708c2ecf20Sopenharmony_ci qp->max_inline_data = mthca_max_inline_data(pd, max_data_size); 9718c2ecf20Sopenharmony_ci 9728c2ecf20Sopenharmony_ci qp->sq.max_gs = min_t(int, dev->limits.max_sg, 9738c2ecf20Sopenharmony_ci max_data_size / sizeof (struct mthca_data_seg)); 9748c2ecf20Sopenharmony_ci qp->rq.max_gs = min_t(int, dev->limits.max_sg, 9758c2ecf20Sopenharmony_ci (min(dev->limits.max_desc_sz, 1 << qp->rq.wqe_shift) - 9768c2ecf20Sopenharmony_ci sizeof (struct mthca_next_seg)) / 9778c2ecf20Sopenharmony_ci sizeof (struct mthca_data_seg)); 9788c2ecf20Sopenharmony_ci} 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_ci/* 9818c2ecf20Sopenharmony_ci * Allocate and register buffer for WQEs. qp->rq.max, sq.max, 9828c2ecf20Sopenharmony_ci * rq.max_gs and sq.max_gs must all be assigned. 9838c2ecf20Sopenharmony_ci * mthca_alloc_wqe_buf will calculate rq.wqe_shift and 9848c2ecf20Sopenharmony_ci * sq.wqe_shift (as well as send_wqe_offset, is_direct, and 9858c2ecf20Sopenharmony_ci * queue) 9868c2ecf20Sopenharmony_ci */ 9878c2ecf20Sopenharmony_cistatic int mthca_alloc_wqe_buf(struct mthca_dev *dev, 9888c2ecf20Sopenharmony_ci struct mthca_pd *pd, 9898c2ecf20Sopenharmony_ci struct mthca_qp *qp, 9908c2ecf20Sopenharmony_ci struct ib_udata *udata) 9918c2ecf20Sopenharmony_ci{ 9928c2ecf20Sopenharmony_ci int size; 9938c2ecf20Sopenharmony_ci int err = -ENOMEM; 9948c2ecf20Sopenharmony_ci 9958c2ecf20Sopenharmony_ci size = sizeof (struct mthca_next_seg) + 9968c2ecf20Sopenharmony_ci qp->rq.max_gs * sizeof (struct mthca_data_seg); 9978c2ecf20Sopenharmony_ci 9988c2ecf20Sopenharmony_ci if (size > dev->limits.max_desc_sz) 9998c2ecf20Sopenharmony_ci return -EINVAL; 10008c2ecf20Sopenharmony_ci 10018c2ecf20Sopenharmony_ci for (qp->rq.wqe_shift = 6; 1 << qp->rq.wqe_shift < size; 10028c2ecf20Sopenharmony_ci qp->rq.wqe_shift++) 10038c2ecf20Sopenharmony_ci ; /* nothing */ 10048c2ecf20Sopenharmony_ci 10058c2ecf20Sopenharmony_ci size = qp->sq.max_gs * sizeof (struct mthca_data_seg); 10068c2ecf20Sopenharmony_ci switch (qp->transport) { 10078c2ecf20Sopenharmony_ci case MLX: 10088c2ecf20Sopenharmony_ci size += 2 * sizeof (struct mthca_data_seg); 10098c2ecf20Sopenharmony_ci break; 10108c2ecf20Sopenharmony_ci 10118c2ecf20Sopenharmony_ci case UD: 10128c2ecf20Sopenharmony_ci size += mthca_is_memfree(dev) ? 10138c2ecf20Sopenharmony_ci sizeof (struct mthca_arbel_ud_seg) : 10148c2ecf20Sopenharmony_ci sizeof (struct mthca_tavor_ud_seg); 10158c2ecf20Sopenharmony_ci break; 10168c2ecf20Sopenharmony_ci 10178c2ecf20Sopenharmony_ci case UC: 10188c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg); 10198c2ecf20Sopenharmony_ci break; 10208c2ecf20Sopenharmony_ci 10218c2ecf20Sopenharmony_ci case RC: 10228c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg); 10238c2ecf20Sopenharmony_ci /* 10248c2ecf20Sopenharmony_ci * An atomic op will require an atomic segment, a 10258c2ecf20Sopenharmony_ci * remote address segment and one scatter entry. 10268c2ecf20Sopenharmony_ci */ 10278c2ecf20Sopenharmony_ci size = max_t(int, size, 10288c2ecf20Sopenharmony_ci sizeof (struct mthca_atomic_seg) + 10298c2ecf20Sopenharmony_ci sizeof (struct mthca_raddr_seg) + 10308c2ecf20Sopenharmony_ci sizeof (struct mthca_data_seg)); 10318c2ecf20Sopenharmony_ci break; 10328c2ecf20Sopenharmony_ci 10338c2ecf20Sopenharmony_ci default: 10348c2ecf20Sopenharmony_ci break; 10358c2ecf20Sopenharmony_ci } 10368c2ecf20Sopenharmony_ci 10378c2ecf20Sopenharmony_ci /* Make sure that we have enough space for a bind request */ 10388c2ecf20Sopenharmony_ci size = max_t(int, size, sizeof (struct mthca_bind_seg)); 10398c2ecf20Sopenharmony_ci 10408c2ecf20Sopenharmony_ci size += sizeof (struct mthca_next_seg); 10418c2ecf20Sopenharmony_ci 10428c2ecf20Sopenharmony_ci if (size > dev->limits.max_desc_sz) 10438c2ecf20Sopenharmony_ci return -EINVAL; 10448c2ecf20Sopenharmony_ci 10458c2ecf20Sopenharmony_ci for (qp->sq.wqe_shift = 6; 1 << qp->sq.wqe_shift < size; 10468c2ecf20Sopenharmony_ci qp->sq.wqe_shift++) 10478c2ecf20Sopenharmony_ci ; /* nothing */ 10488c2ecf20Sopenharmony_ci 10498c2ecf20Sopenharmony_ci qp->send_wqe_offset = ALIGN(qp->rq.max << qp->rq.wqe_shift, 10508c2ecf20Sopenharmony_ci 1 << qp->sq.wqe_shift); 10518c2ecf20Sopenharmony_ci 10528c2ecf20Sopenharmony_ci /* 10538c2ecf20Sopenharmony_ci * If this is a userspace QP, we don't actually have to 10548c2ecf20Sopenharmony_ci * allocate anything. All we need is to calculate the WQE 10558c2ecf20Sopenharmony_ci * sizes and the send_wqe_offset, so we're done now. 10568c2ecf20Sopenharmony_ci */ 10578c2ecf20Sopenharmony_ci if (udata) 10588c2ecf20Sopenharmony_ci return 0; 10598c2ecf20Sopenharmony_ci 10608c2ecf20Sopenharmony_ci size = PAGE_ALIGN(qp->send_wqe_offset + 10618c2ecf20Sopenharmony_ci (qp->sq.max << qp->sq.wqe_shift)); 10628c2ecf20Sopenharmony_ci 10638c2ecf20Sopenharmony_ci qp->wrid = kmalloc_array(qp->rq.max + qp->sq.max, sizeof(u64), 10648c2ecf20Sopenharmony_ci GFP_KERNEL); 10658c2ecf20Sopenharmony_ci if (!qp->wrid) 10668c2ecf20Sopenharmony_ci goto err_out; 10678c2ecf20Sopenharmony_ci 10688c2ecf20Sopenharmony_ci err = mthca_buf_alloc(dev, size, MTHCA_MAX_DIRECT_QP_SIZE, 10698c2ecf20Sopenharmony_ci &qp->queue, &qp->is_direct, pd, 0, &qp->mr); 10708c2ecf20Sopenharmony_ci if (err) 10718c2ecf20Sopenharmony_ci goto err_out; 10728c2ecf20Sopenharmony_ci 10738c2ecf20Sopenharmony_ci return 0; 10748c2ecf20Sopenharmony_ci 10758c2ecf20Sopenharmony_cierr_out: 10768c2ecf20Sopenharmony_ci kfree(qp->wrid); 10778c2ecf20Sopenharmony_ci return err; 10788c2ecf20Sopenharmony_ci} 10798c2ecf20Sopenharmony_ci 10808c2ecf20Sopenharmony_cistatic void mthca_free_wqe_buf(struct mthca_dev *dev, 10818c2ecf20Sopenharmony_ci struct mthca_qp *qp) 10828c2ecf20Sopenharmony_ci{ 10838c2ecf20Sopenharmony_ci mthca_buf_free(dev, PAGE_ALIGN(qp->send_wqe_offset + 10848c2ecf20Sopenharmony_ci (qp->sq.max << qp->sq.wqe_shift)), 10858c2ecf20Sopenharmony_ci &qp->queue, qp->is_direct, &qp->mr); 10868c2ecf20Sopenharmony_ci kfree(qp->wrid); 10878c2ecf20Sopenharmony_ci} 10888c2ecf20Sopenharmony_ci 10898c2ecf20Sopenharmony_cistatic int mthca_map_memfree(struct mthca_dev *dev, 10908c2ecf20Sopenharmony_ci struct mthca_qp *qp) 10918c2ecf20Sopenharmony_ci{ 10928c2ecf20Sopenharmony_ci int ret; 10938c2ecf20Sopenharmony_ci 10948c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 10958c2ecf20Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.qp_table, qp->qpn); 10968c2ecf20Sopenharmony_ci if (ret) 10978c2ecf20Sopenharmony_ci return ret; 10988c2ecf20Sopenharmony_ci 10998c2ecf20Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.eqp_table, qp->qpn); 11008c2ecf20Sopenharmony_ci if (ret) 11018c2ecf20Sopenharmony_ci goto err_qpc; 11028c2ecf20Sopenharmony_ci 11038c2ecf20Sopenharmony_ci ret = mthca_table_get(dev, dev->qp_table.rdb_table, 11048c2ecf20Sopenharmony_ci qp->qpn << dev->qp_table.rdb_shift); 11058c2ecf20Sopenharmony_ci if (ret) 11068c2ecf20Sopenharmony_ci goto err_eqpc; 11078c2ecf20Sopenharmony_ci 11088c2ecf20Sopenharmony_ci } 11098c2ecf20Sopenharmony_ci 11108c2ecf20Sopenharmony_ci return 0; 11118c2ecf20Sopenharmony_ci 11128c2ecf20Sopenharmony_cierr_eqpc: 11138c2ecf20Sopenharmony_ci mthca_table_put(dev, dev->qp_table.eqp_table, qp->qpn); 11148c2ecf20Sopenharmony_ci 11158c2ecf20Sopenharmony_cierr_qpc: 11168c2ecf20Sopenharmony_ci mthca_table_put(dev, dev->qp_table.qp_table, qp->qpn); 11178c2ecf20Sopenharmony_ci 11188c2ecf20Sopenharmony_ci return ret; 11198c2ecf20Sopenharmony_ci} 11208c2ecf20Sopenharmony_ci 11218c2ecf20Sopenharmony_cistatic void mthca_unmap_memfree(struct mthca_dev *dev, 11228c2ecf20Sopenharmony_ci struct mthca_qp *qp) 11238c2ecf20Sopenharmony_ci{ 11248c2ecf20Sopenharmony_ci mthca_table_put(dev, dev->qp_table.rdb_table, 11258c2ecf20Sopenharmony_ci qp->qpn << dev->qp_table.rdb_shift); 11268c2ecf20Sopenharmony_ci mthca_table_put(dev, dev->qp_table.eqp_table, qp->qpn); 11278c2ecf20Sopenharmony_ci mthca_table_put(dev, dev->qp_table.qp_table, qp->qpn); 11288c2ecf20Sopenharmony_ci} 11298c2ecf20Sopenharmony_ci 11308c2ecf20Sopenharmony_cistatic int mthca_alloc_memfree(struct mthca_dev *dev, 11318c2ecf20Sopenharmony_ci struct mthca_qp *qp) 11328c2ecf20Sopenharmony_ci{ 11338c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 11348c2ecf20Sopenharmony_ci qp->rq.db_index = mthca_alloc_db(dev, MTHCA_DB_TYPE_RQ, 11358c2ecf20Sopenharmony_ci qp->qpn, &qp->rq.db); 11368c2ecf20Sopenharmony_ci if (qp->rq.db_index < 0) 11378c2ecf20Sopenharmony_ci return -ENOMEM; 11388c2ecf20Sopenharmony_ci 11398c2ecf20Sopenharmony_ci qp->sq.db_index = mthca_alloc_db(dev, MTHCA_DB_TYPE_SQ, 11408c2ecf20Sopenharmony_ci qp->qpn, &qp->sq.db); 11418c2ecf20Sopenharmony_ci if (qp->sq.db_index < 0) { 11428c2ecf20Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_RQ, qp->rq.db_index); 11438c2ecf20Sopenharmony_ci return -ENOMEM; 11448c2ecf20Sopenharmony_ci } 11458c2ecf20Sopenharmony_ci } 11468c2ecf20Sopenharmony_ci 11478c2ecf20Sopenharmony_ci return 0; 11488c2ecf20Sopenharmony_ci} 11498c2ecf20Sopenharmony_ci 11508c2ecf20Sopenharmony_cistatic void mthca_free_memfree(struct mthca_dev *dev, 11518c2ecf20Sopenharmony_ci struct mthca_qp *qp) 11528c2ecf20Sopenharmony_ci{ 11538c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 11548c2ecf20Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_SQ, qp->sq.db_index); 11558c2ecf20Sopenharmony_ci mthca_free_db(dev, MTHCA_DB_TYPE_RQ, qp->rq.db_index); 11568c2ecf20Sopenharmony_ci } 11578c2ecf20Sopenharmony_ci} 11588c2ecf20Sopenharmony_ci 11598c2ecf20Sopenharmony_cistatic int mthca_alloc_qp_common(struct mthca_dev *dev, 11608c2ecf20Sopenharmony_ci struct mthca_pd *pd, 11618c2ecf20Sopenharmony_ci struct mthca_cq *send_cq, 11628c2ecf20Sopenharmony_ci struct mthca_cq *recv_cq, 11638c2ecf20Sopenharmony_ci enum ib_sig_type send_policy, 11648c2ecf20Sopenharmony_ci struct mthca_qp *qp, 11658c2ecf20Sopenharmony_ci struct ib_udata *udata) 11668c2ecf20Sopenharmony_ci{ 11678c2ecf20Sopenharmony_ci int ret; 11688c2ecf20Sopenharmony_ci int i; 11698c2ecf20Sopenharmony_ci struct mthca_next_seg *next; 11708c2ecf20Sopenharmony_ci 11718c2ecf20Sopenharmony_ci qp->refcount = 1; 11728c2ecf20Sopenharmony_ci init_waitqueue_head(&qp->wait); 11738c2ecf20Sopenharmony_ci mutex_init(&qp->mutex); 11748c2ecf20Sopenharmony_ci qp->state = IB_QPS_RESET; 11758c2ecf20Sopenharmony_ci qp->atomic_rd_en = 0; 11768c2ecf20Sopenharmony_ci qp->resp_depth = 0; 11778c2ecf20Sopenharmony_ci qp->sq_policy = send_policy; 11788c2ecf20Sopenharmony_ci mthca_wq_reset(&qp->sq); 11798c2ecf20Sopenharmony_ci mthca_wq_reset(&qp->rq); 11808c2ecf20Sopenharmony_ci 11818c2ecf20Sopenharmony_ci spin_lock_init(&qp->sq.lock); 11828c2ecf20Sopenharmony_ci spin_lock_init(&qp->rq.lock); 11838c2ecf20Sopenharmony_ci 11848c2ecf20Sopenharmony_ci ret = mthca_map_memfree(dev, qp); 11858c2ecf20Sopenharmony_ci if (ret) 11868c2ecf20Sopenharmony_ci return ret; 11878c2ecf20Sopenharmony_ci 11888c2ecf20Sopenharmony_ci ret = mthca_alloc_wqe_buf(dev, pd, qp, udata); 11898c2ecf20Sopenharmony_ci if (ret) { 11908c2ecf20Sopenharmony_ci mthca_unmap_memfree(dev, qp); 11918c2ecf20Sopenharmony_ci return ret; 11928c2ecf20Sopenharmony_ci } 11938c2ecf20Sopenharmony_ci 11948c2ecf20Sopenharmony_ci mthca_adjust_qp_caps(dev, pd, qp); 11958c2ecf20Sopenharmony_ci 11968c2ecf20Sopenharmony_ci /* 11978c2ecf20Sopenharmony_ci * If this is a userspace QP, we're done now. The doorbells 11988c2ecf20Sopenharmony_ci * will be allocated and buffers will be initialized in 11998c2ecf20Sopenharmony_ci * userspace. 12008c2ecf20Sopenharmony_ci */ 12018c2ecf20Sopenharmony_ci if (udata) 12028c2ecf20Sopenharmony_ci return 0; 12038c2ecf20Sopenharmony_ci 12048c2ecf20Sopenharmony_ci ret = mthca_alloc_memfree(dev, qp); 12058c2ecf20Sopenharmony_ci if (ret) { 12068c2ecf20Sopenharmony_ci mthca_free_wqe_buf(dev, qp); 12078c2ecf20Sopenharmony_ci mthca_unmap_memfree(dev, qp); 12088c2ecf20Sopenharmony_ci return ret; 12098c2ecf20Sopenharmony_ci } 12108c2ecf20Sopenharmony_ci 12118c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 12128c2ecf20Sopenharmony_ci struct mthca_data_seg *scatter; 12138c2ecf20Sopenharmony_ci int size = (sizeof (struct mthca_next_seg) + 12148c2ecf20Sopenharmony_ci qp->rq.max_gs * sizeof (struct mthca_data_seg)) / 16; 12158c2ecf20Sopenharmony_ci 12168c2ecf20Sopenharmony_ci for (i = 0; i < qp->rq.max; ++i) { 12178c2ecf20Sopenharmony_ci next = get_recv_wqe(qp, i); 12188c2ecf20Sopenharmony_ci next->nda_op = cpu_to_be32(((i + 1) & (qp->rq.max - 1)) << 12198c2ecf20Sopenharmony_ci qp->rq.wqe_shift); 12208c2ecf20Sopenharmony_ci next->ee_nds = cpu_to_be32(size); 12218c2ecf20Sopenharmony_ci 12228c2ecf20Sopenharmony_ci for (scatter = (void *) (next + 1); 12238c2ecf20Sopenharmony_ci (void *) scatter < (void *) next + (1 << qp->rq.wqe_shift); 12248c2ecf20Sopenharmony_ci ++scatter) 12258c2ecf20Sopenharmony_ci scatter->lkey = cpu_to_be32(MTHCA_INVAL_LKEY); 12268c2ecf20Sopenharmony_ci } 12278c2ecf20Sopenharmony_ci 12288c2ecf20Sopenharmony_ci for (i = 0; i < qp->sq.max; ++i) { 12298c2ecf20Sopenharmony_ci next = get_send_wqe(qp, i); 12308c2ecf20Sopenharmony_ci next->nda_op = cpu_to_be32((((i + 1) & (qp->sq.max - 1)) << 12318c2ecf20Sopenharmony_ci qp->sq.wqe_shift) + 12328c2ecf20Sopenharmony_ci qp->send_wqe_offset); 12338c2ecf20Sopenharmony_ci } 12348c2ecf20Sopenharmony_ci } else { 12358c2ecf20Sopenharmony_ci for (i = 0; i < qp->rq.max; ++i) { 12368c2ecf20Sopenharmony_ci next = get_recv_wqe(qp, i); 12378c2ecf20Sopenharmony_ci next->nda_op = htonl((((i + 1) % qp->rq.max) << 12388c2ecf20Sopenharmony_ci qp->rq.wqe_shift) | 1); 12398c2ecf20Sopenharmony_ci } 12408c2ecf20Sopenharmony_ci 12418c2ecf20Sopenharmony_ci } 12428c2ecf20Sopenharmony_ci 12438c2ecf20Sopenharmony_ci qp->sq.last = get_send_wqe(qp, qp->sq.max - 1); 12448c2ecf20Sopenharmony_ci qp->rq.last = get_recv_wqe(qp, qp->rq.max - 1); 12458c2ecf20Sopenharmony_ci 12468c2ecf20Sopenharmony_ci return 0; 12478c2ecf20Sopenharmony_ci} 12488c2ecf20Sopenharmony_ci 12498c2ecf20Sopenharmony_cistatic int mthca_set_qp_size(struct mthca_dev *dev, struct ib_qp_cap *cap, 12508c2ecf20Sopenharmony_ci struct mthca_pd *pd, struct mthca_qp *qp) 12518c2ecf20Sopenharmony_ci{ 12528c2ecf20Sopenharmony_ci int max_data_size = mthca_max_data_size(dev, qp, dev->limits.max_desc_sz); 12538c2ecf20Sopenharmony_ci 12548c2ecf20Sopenharmony_ci /* Sanity check QP size before proceeding */ 12558c2ecf20Sopenharmony_ci if (cap->max_send_wr > dev->limits.max_wqes || 12568c2ecf20Sopenharmony_ci cap->max_recv_wr > dev->limits.max_wqes || 12578c2ecf20Sopenharmony_ci cap->max_send_sge > dev->limits.max_sg || 12588c2ecf20Sopenharmony_ci cap->max_recv_sge > dev->limits.max_sg || 12598c2ecf20Sopenharmony_ci cap->max_inline_data > mthca_max_inline_data(pd, max_data_size)) 12608c2ecf20Sopenharmony_ci return -EINVAL; 12618c2ecf20Sopenharmony_ci 12628c2ecf20Sopenharmony_ci /* 12638c2ecf20Sopenharmony_ci * For MLX transport we need 2 extra send gather entries: 12648c2ecf20Sopenharmony_ci * one for the header and one for the checksum at the end 12658c2ecf20Sopenharmony_ci */ 12668c2ecf20Sopenharmony_ci if (qp->transport == MLX && cap->max_send_sge + 2 > dev->limits.max_sg) 12678c2ecf20Sopenharmony_ci return -EINVAL; 12688c2ecf20Sopenharmony_ci 12698c2ecf20Sopenharmony_ci if (mthca_is_memfree(dev)) { 12708c2ecf20Sopenharmony_ci qp->rq.max = cap->max_recv_wr ? 12718c2ecf20Sopenharmony_ci roundup_pow_of_two(cap->max_recv_wr) : 0; 12728c2ecf20Sopenharmony_ci qp->sq.max = cap->max_send_wr ? 12738c2ecf20Sopenharmony_ci roundup_pow_of_two(cap->max_send_wr) : 0; 12748c2ecf20Sopenharmony_ci } else { 12758c2ecf20Sopenharmony_ci qp->rq.max = cap->max_recv_wr; 12768c2ecf20Sopenharmony_ci qp->sq.max = cap->max_send_wr; 12778c2ecf20Sopenharmony_ci } 12788c2ecf20Sopenharmony_ci 12798c2ecf20Sopenharmony_ci qp->rq.max_gs = cap->max_recv_sge; 12808c2ecf20Sopenharmony_ci qp->sq.max_gs = max_t(int, cap->max_send_sge, 12818c2ecf20Sopenharmony_ci ALIGN(cap->max_inline_data + MTHCA_INLINE_HEADER_SIZE, 12828c2ecf20Sopenharmony_ci MTHCA_INLINE_CHUNK_SIZE) / 12838c2ecf20Sopenharmony_ci sizeof (struct mthca_data_seg)); 12848c2ecf20Sopenharmony_ci 12858c2ecf20Sopenharmony_ci return 0; 12868c2ecf20Sopenharmony_ci} 12878c2ecf20Sopenharmony_ci 12888c2ecf20Sopenharmony_ciint mthca_alloc_qp(struct mthca_dev *dev, 12898c2ecf20Sopenharmony_ci struct mthca_pd *pd, 12908c2ecf20Sopenharmony_ci struct mthca_cq *send_cq, 12918c2ecf20Sopenharmony_ci struct mthca_cq *recv_cq, 12928c2ecf20Sopenharmony_ci enum ib_qp_type type, 12938c2ecf20Sopenharmony_ci enum ib_sig_type send_policy, 12948c2ecf20Sopenharmony_ci struct ib_qp_cap *cap, 12958c2ecf20Sopenharmony_ci struct mthca_qp *qp, 12968c2ecf20Sopenharmony_ci struct ib_udata *udata) 12978c2ecf20Sopenharmony_ci{ 12988c2ecf20Sopenharmony_ci int err; 12998c2ecf20Sopenharmony_ci 13008c2ecf20Sopenharmony_ci switch (type) { 13018c2ecf20Sopenharmony_ci case IB_QPT_RC: qp->transport = RC; break; 13028c2ecf20Sopenharmony_ci case IB_QPT_UC: qp->transport = UC; break; 13038c2ecf20Sopenharmony_ci case IB_QPT_UD: qp->transport = UD; break; 13048c2ecf20Sopenharmony_ci default: return -EINVAL; 13058c2ecf20Sopenharmony_ci } 13068c2ecf20Sopenharmony_ci 13078c2ecf20Sopenharmony_ci err = mthca_set_qp_size(dev, cap, pd, qp); 13088c2ecf20Sopenharmony_ci if (err) 13098c2ecf20Sopenharmony_ci return err; 13108c2ecf20Sopenharmony_ci 13118c2ecf20Sopenharmony_ci qp->qpn = mthca_alloc(&dev->qp_table.alloc); 13128c2ecf20Sopenharmony_ci if (qp->qpn == -1) 13138c2ecf20Sopenharmony_ci return -ENOMEM; 13148c2ecf20Sopenharmony_ci 13158c2ecf20Sopenharmony_ci /* initialize port to zero for error-catching. */ 13168c2ecf20Sopenharmony_ci qp->port = 0; 13178c2ecf20Sopenharmony_ci 13188c2ecf20Sopenharmony_ci err = mthca_alloc_qp_common(dev, pd, send_cq, recv_cq, 13198c2ecf20Sopenharmony_ci send_policy, qp, udata); 13208c2ecf20Sopenharmony_ci if (err) { 13218c2ecf20Sopenharmony_ci mthca_free(&dev->qp_table.alloc, qp->qpn); 13228c2ecf20Sopenharmony_ci return err; 13238c2ecf20Sopenharmony_ci } 13248c2ecf20Sopenharmony_ci 13258c2ecf20Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 13268c2ecf20Sopenharmony_ci mthca_array_set(&dev->qp_table.qp, 13278c2ecf20Sopenharmony_ci qp->qpn & (dev->limits.num_qps - 1), qp); 13288c2ecf20Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 13298c2ecf20Sopenharmony_ci 13308c2ecf20Sopenharmony_ci return 0; 13318c2ecf20Sopenharmony_ci} 13328c2ecf20Sopenharmony_ci 13338c2ecf20Sopenharmony_cistatic void mthca_lock_cqs(struct mthca_cq *send_cq, struct mthca_cq *recv_cq) 13348c2ecf20Sopenharmony_ci __acquires(&send_cq->lock) __acquires(&recv_cq->lock) 13358c2ecf20Sopenharmony_ci{ 13368c2ecf20Sopenharmony_ci if (send_cq == recv_cq) { 13378c2ecf20Sopenharmony_ci spin_lock_irq(&send_cq->lock); 13388c2ecf20Sopenharmony_ci __acquire(&recv_cq->lock); 13398c2ecf20Sopenharmony_ci } else if (send_cq->cqn < recv_cq->cqn) { 13408c2ecf20Sopenharmony_ci spin_lock_irq(&send_cq->lock); 13418c2ecf20Sopenharmony_ci spin_lock_nested(&recv_cq->lock, SINGLE_DEPTH_NESTING); 13428c2ecf20Sopenharmony_ci } else { 13438c2ecf20Sopenharmony_ci spin_lock_irq(&recv_cq->lock); 13448c2ecf20Sopenharmony_ci spin_lock_nested(&send_cq->lock, SINGLE_DEPTH_NESTING); 13458c2ecf20Sopenharmony_ci } 13468c2ecf20Sopenharmony_ci} 13478c2ecf20Sopenharmony_ci 13488c2ecf20Sopenharmony_cistatic void mthca_unlock_cqs(struct mthca_cq *send_cq, struct mthca_cq *recv_cq) 13498c2ecf20Sopenharmony_ci __releases(&send_cq->lock) __releases(&recv_cq->lock) 13508c2ecf20Sopenharmony_ci{ 13518c2ecf20Sopenharmony_ci if (send_cq == recv_cq) { 13528c2ecf20Sopenharmony_ci __release(&recv_cq->lock); 13538c2ecf20Sopenharmony_ci spin_unlock_irq(&send_cq->lock); 13548c2ecf20Sopenharmony_ci } else if (send_cq->cqn < recv_cq->cqn) { 13558c2ecf20Sopenharmony_ci spin_unlock(&recv_cq->lock); 13568c2ecf20Sopenharmony_ci spin_unlock_irq(&send_cq->lock); 13578c2ecf20Sopenharmony_ci } else { 13588c2ecf20Sopenharmony_ci spin_unlock(&send_cq->lock); 13598c2ecf20Sopenharmony_ci spin_unlock_irq(&recv_cq->lock); 13608c2ecf20Sopenharmony_ci } 13618c2ecf20Sopenharmony_ci} 13628c2ecf20Sopenharmony_ci 13638c2ecf20Sopenharmony_ciint mthca_alloc_sqp(struct mthca_dev *dev, 13648c2ecf20Sopenharmony_ci struct mthca_pd *pd, 13658c2ecf20Sopenharmony_ci struct mthca_cq *send_cq, 13668c2ecf20Sopenharmony_ci struct mthca_cq *recv_cq, 13678c2ecf20Sopenharmony_ci enum ib_sig_type send_policy, 13688c2ecf20Sopenharmony_ci struct ib_qp_cap *cap, 13698c2ecf20Sopenharmony_ci int qpn, 13708c2ecf20Sopenharmony_ci int port, 13718c2ecf20Sopenharmony_ci struct mthca_qp *qp, 13728c2ecf20Sopenharmony_ci struct ib_udata *udata) 13738c2ecf20Sopenharmony_ci{ 13748c2ecf20Sopenharmony_ci u32 mqpn = qpn * 2 + dev->qp_table.sqp_start + port - 1; 13758c2ecf20Sopenharmony_ci int err; 13768c2ecf20Sopenharmony_ci 13778c2ecf20Sopenharmony_ci qp->transport = MLX; 13788c2ecf20Sopenharmony_ci err = mthca_set_qp_size(dev, cap, pd, qp); 13798c2ecf20Sopenharmony_ci if (err) 13808c2ecf20Sopenharmony_ci return err; 13818c2ecf20Sopenharmony_ci 13828c2ecf20Sopenharmony_ci qp->sqp->header_buf_size = qp->sq.max * MTHCA_UD_HEADER_SIZE; 13838c2ecf20Sopenharmony_ci qp->sqp->header_buf = 13848c2ecf20Sopenharmony_ci dma_alloc_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 13858c2ecf20Sopenharmony_ci &qp->sqp->header_dma, GFP_KERNEL); 13868c2ecf20Sopenharmony_ci if (!qp->sqp->header_buf) 13878c2ecf20Sopenharmony_ci return -ENOMEM; 13888c2ecf20Sopenharmony_ci 13898c2ecf20Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 13908c2ecf20Sopenharmony_ci if (mthca_array_get(&dev->qp_table.qp, mqpn)) 13918c2ecf20Sopenharmony_ci err = -EBUSY; 13928c2ecf20Sopenharmony_ci else 13938c2ecf20Sopenharmony_ci mthca_array_set(&dev->qp_table.qp, mqpn, qp); 13948c2ecf20Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 13958c2ecf20Sopenharmony_ci 13968c2ecf20Sopenharmony_ci if (err) 13978c2ecf20Sopenharmony_ci goto err_out; 13988c2ecf20Sopenharmony_ci 13998c2ecf20Sopenharmony_ci qp->port = port; 14008c2ecf20Sopenharmony_ci qp->qpn = mqpn; 14018c2ecf20Sopenharmony_ci qp->transport = MLX; 14028c2ecf20Sopenharmony_ci 14038c2ecf20Sopenharmony_ci err = mthca_alloc_qp_common(dev, pd, send_cq, recv_cq, 14048c2ecf20Sopenharmony_ci send_policy, qp, udata); 14058c2ecf20Sopenharmony_ci if (err) 14068c2ecf20Sopenharmony_ci goto err_out_free; 14078c2ecf20Sopenharmony_ci 14088c2ecf20Sopenharmony_ci atomic_inc(&pd->sqp_count); 14098c2ecf20Sopenharmony_ci 14108c2ecf20Sopenharmony_ci return 0; 14118c2ecf20Sopenharmony_ci 14128c2ecf20Sopenharmony_ci err_out_free: 14138c2ecf20Sopenharmony_ci /* 14148c2ecf20Sopenharmony_ci * Lock CQs here, so that CQ polling code can do QP lookup 14158c2ecf20Sopenharmony_ci * without taking a lock. 14168c2ecf20Sopenharmony_ci */ 14178c2ecf20Sopenharmony_ci mthca_lock_cqs(send_cq, recv_cq); 14188c2ecf20Sopenharmony_ci 14198c2ecf20Sopenharmony_ci spin_lock(&dev->qp_table.lock); 14208c2ecf20Sopenharmony_ci mthca_array_clear(&dev->qp_table.qp, mqpn); 14218c2ecf20Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 14228c2ecf20Sopenharmony_ci 14238c2ecf20Sopenharmony_ci mthca_unlock_cqs(send_cq, recv_cq); 14248c2ecf20Sopenharmony_ci 14258c2ecf20Sopenharmony_cierr_out: 14268c2ecf20Sopenharmony_ci dma_free_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 14278c2ecf20Sopenharmony_ci qp->sqp->header_buf, qp->sqp->header_dma); 14288c2ecf20Sopenharmony_ci return err; 14298c2ecf20Sopenharmony_ci} 14308c2ecf20Sopenharmony_ci 14318c2ecf20Sopenharmony_cistatic inline int get_qp_refcount(struct mthca_dev *dev, struct mthca_qp *qp) 14328c2ecf20Sopenharmony_ci{ 14338c2ecf20Sopenharmony_ci int c; 14348c2ecf20Sopenharmony_ci 14358c2ecf20Sopenharmony_ci spin_lock_irq(&dev->qp_table.lock); 14368c2ecf20Sopenharmony_ci c = qp->refcount; 14378c2ecf20Sopenharmony_ci spin_unlock_irq(&dev->qp_table.lock); 14388c2ecf20Sopenharmony_ci 14398c2ecf20Sopenharmony_ci return c; 14408c2ecf20Sopenharmony_ci} 14418c2ecf20Sopenharmony_ci 14428c2ecf20Sopenharmony_civoid mthca_free_qp(struct mthca_dev *dev, 14438c2ecf20Sopenharmony_ci struct mthca_qp *qp) 14448c2ecf20Sopenharmony_ci{ 14458c2ecf20Sopenharmony_ci struct mthca_cq *send_cq; 14468c2ecf20Sopenharmony_ci struct mthca_cq *recv_cq; 14478c2ecf20Sopenharmony_ci 14488c2ecf20Sopenharmony_ci send_cq = to_mcq(qp->ibqp.send_cq); 14498c2ecf20Sopenharmony_ci recv_cq = to_mcq(qp->ibqp.recv_cq); 14508c2ecf20Sopenharmony_ci 14518c2ecf20Sopenharmony_ci /* 14528c2ecf20Sopenharmony_ci * Lock CQs here, so that CQ polling code can do QP lookup 14538c2ecf20Sopenharmony_ci * without taking a lock. 14548c2ecf20Sopenharmony_ci */ 14558c2ecf20Sopenharmony_ci mthca_lock_cqs(send_cq, recv_cq); 14568c2ecf20Sopenharmony_ci 14578c2ecf20Sopenharmony_ci spin_lock(&dev->qp_table.lock); 14588c2ecf20Sopenharmony_ci mthca_array_clear(&dev->qp_table.qp, 14598c2ecf20Sopenharmony_ci qp->qpn & (dev->limits.num_qps - 1)); 14608c2ecf20Sopenharmony_ci --qp->refcount; 14618c2ecf20Sopenharmony_ci spin_unlock(&dev->qp_table.lock); 14628c2ecf20Sopenharmony_ci 14638c2ecf20Sopenharmony_ci mthca_unlock_cqs(send_cq, recv_cq); 14648c2ecf20Sopenharmony_ci 14658c2ecf20Sopenharmony_ci wait_event(qp->wait, !get_qp_refcount(dev, qp)); 14668c2ecf20Sopenharmony_ci 14678c2ecf20Sopenharmony_ci if (qp->state != IB_QPS_RESET) 14688c2ecf20Sopenharmony_ci mthca_MODIFY_QP(dev, qp->state, IB_QPS_RESET, qp->qpn, 0, 14698c2ecf20Sopenharmony_ci NULL, 0); 14708c2ecf20Sopenharmony_ci 14718c2ecf20Sopenharmony_ci /* 14728c2ecf20Sopenharmony_ci * If this is a userspace QP, the buffers, MR, CQs and so on 14738c2ecf20Sopenharmony_ci * will be cleaned up in userspace, so all we have to do is 14748c2ecf20Sopenharmony_ci * unref the mem-free tables and free the QPN in our table. 14758c2ecf20Sopenharmony_ci */ 14768c2ecf20Sopenharmony_ci if (!qp->ibqp.uobject) { 14778c2ecf20Sopenharmony_ci mthca_cq_clean(dev, recv_cq, qp->qpn, 14788c2ecf20Sopenharmony_ci qp->ibqp.srq ? to_msrq(qp->ibqp.srq) : NULL); 14798c2ecf20Sopenharmony_ci if (send_cq != recv_cq) 14808c2ecf20Sopenharmony_ci mthca_cq_clean(dev, send_cq, qp->qpn, NULL); 14818c2ecf20Sopenharmony_ci 14828c2ecf20Sopenharmony_ci mthca_free_memfree(dev, qp); 14838c2ecf20Sopenharmony_ci mthca_free_wqe_buf(dev, qp); 14848c2ecf20Sopenharmony_ci } 14858c2ecf20Sopenharmony_ci 14868c2ecf20Sopenharmony_ci mthca_unmap_memfree(dev, qp); 14878c2ecf20Sopenharmony_ci 14888c2ecf20Sopenharmony_ci if (is_sqp(dev, qp)) { 14898c2ecf20Sopenharmony_ci atomic_dec(&(to_mpd(qp->ibqp.pd)->sqp_count)); 14908c2ecf20Sopenharmony_ci dma_free_coherent(&dev->pdev->dev, qp->sqp->header_buf_size, 14918c2ecf20Sopenharmony_ci qp->sqp->header_buf, qp->sqp->header_dma); 14928c2ecf20Sopenharmony_ci } else 14938c2ecf20Sopenharmony_ci mthca_free(&dev->qp_table.alloc, qp->qpn); 14948c2ecf20Sopenharmony_ci} 14958c2ecf20Sopenharmony_ci 14968c2ecf20Sopenharmony_ci/* Create UD header for an MLX send and build a data segment for it */ 14978c2ecf20Sopenharmony_cistatic int build_mlx_header(struct mthca_dev *dev, struct mthca_qp *qp, int ind, 14988c2ecf20Sopenharmony_ci const struct ib_ud_wr *wr, 14998c2ecf20Sopenharmony_ci struct mthca_mlx_seg *mlx, 15008c2ecf20Sopenharmony_ci struct mthca_data_seg *data) 15018c2ecf20Sopenharmony_ci{ 15028c2ecf20Sopenharmony_ci struct mthca_sqp *sqp = qp->sqp; 15038c2ecf20Sopenharmony_ci int header_size; 15048c2ecf20Sopenharmony_ci int err; 15058c2ecf20Sopenharmony_ci u16 pkey; 15068c2ecf20Sopenharmony_ci 15078c2ecf20Sopenharmony_ci ib_ud_header_init(256, /* assume a MAD */ 1, 0, 0, 15088c2ecf20Sopenharmony_ci mthca_ah_grh_present(to_mah(wr->ah)), 0, 0, 0, 15098c2ecf20Sopenharmony_ci &sqp->ud_header); 15108c2ecf20Sopenharmony_ci 15118c2ecf20Sopenharmony_ci err = mthca_read_ah(dev, to_mah(wr->ah), &sqp->ud_header); 15128c2ecf20Sopenharmony_ci if (err) 15138c2ecf20Sopenharmony_ci return err; 15148c2ecf20Sopenharmony_ci mlx->flags &= ~cpu_to_be32(MTHCA_NEXT_SOLICIT | 1); 15158c2ecf20Sopenharmony_ci mlx->flags |= cpu_to_be32((!qp->ibqp.qp_num ? MTHCA_MLX_VL15 : 0) | 15168c2ecf20Sopenharmony_ci (sqp->ud_header.lrh.destination_lid == 15178c2ecf20Sopenharmony_ci IB_LID_PERMISSIVE ? MTHCA_MLX_SLR : 0) | 15188c2ecf20Sopenharmony_ci (sqp->ud_header.lrh.service_level << 8)); 15198c2ecf20Sopenharmony_ci mlx->rlid = sqp->ud_header.lrh.destination_lid; 15208c2ecf20Sopenharmony_ci mlx->vcrc = 0; 15218c2ecf20Sopenharmony_ci 15228c2ecf20Sopenharmony_ci switch (wr->wr.opcode) { 15238c2ecf20Sopenharmony_ci case IB_WR_SEND: 15248c2ecf20Sopenharmony_ci sqp->ud_header.bth.opcode = IB_OPCODE_UD_SEND_ONLY; 15258c2ecf20Sopenharmony_ci sqp->ud_header.immediate_present = 0; 15268c2ecf20Sopenharmony_ci break; 15278c2ecf20Sopenharmony_ci case IB_WR_SEND_WITH_IMM: 15288c2ecf20Sopenharmony_ci sqp->ud_header.bth.opcode = IB_OPCODE_UD_SEND_ONLY_WITH_IMMEDIATE; 15298c2ecf20Sopenharmony_ci sqp->ud_header.immediate_present = 1; 15308c2ecf20Sopenharmony_ci sqp->ud_header.immediate_data = wr->wr.ex.imm_data; 15318c2ecf20Sopenharmony_ci break; 15328c2ecf20Sopenharmony_ci default: 15338c2ecf20Sopenharmony_ci return -EINVAL; 15348c2ecf20Sopenharmony_ci } 15358c2ecf20Sopenharmony_ci 15368c2ecf20Sopenharmony_ci sqp->ud_header.lrh.virtual_lane = !qp->ibqp.qp_num ? 15 : 0; 15378c2ecf20Sopenharmony_ci if (sqp->ud_header.lrh.destination_lid == IB_LID_PERMISSIVE) 15388c2ecf20Sopenharmony_ci sqp->ud_header.lrh.source_lid = IB_LID_PERMISSIVE; 15398c2ecf20Sopenharmony_ci sqp->ud_header.bth.solicited_event = !!(wr->wr.send_flags & IB_SEND_SOLICITED); 15408c2ecf20Sopenharmony_ci if (!qp->ibqp.qp_num) 15418c2ecf20Sopenharmony_ci ib_get_cached_pkey(&dev->ib_dev, qp->port, sqp->pkey_index, 15428c2ecf20Sopenharmony_ci &pkey); 15438c2ecf20Sopenharmony_ci else 15448c2ecf20Sopenharmony_ci ib_get_cached_pkey(&dev->ib_dev, qp->port, wr->pkey_index, 15458c2ecf20Sopenharmony_ci &pkey); 15468c2ecf20Sopenharmony_ci sqp->ud_header.bth.pkey = cpu_to_be16(pkey); 15478c2ecf20Sopenharmony_ci sqp->ud_header.bth.destination_qpn = cpu_to_be32(wr->remote_qpn); 15488c2ecf20Sopenharmony_ci sqp->ud_header.bth.psn = cpu_to_be32((sqp->send_psn++) & ((1 << 24) - 1)); 15498c2ecf20Sopenharmony_ci sqp->ud_header.deth.qkey = cpu_to_be32(wr->remote_qkey & 0x80000000 ? 15508c2ecf20Sopenharmony_ci sqp->qkey : wr->remote_qkey); 15518c2ecf20Sopenharmony_ci sqp->ud_header.deth.source_qpn = cpu_to_be32(qp->ibqp.qp_num); 15528c2ecf20Sopenharmony_ci 15538c2ecf20Sopenharmony_ci header_size = ib_ud_header_pack(&sqp->ud_header, 15548c2ecf20Sopenharmony_ci sqp->header_buf + 15558c2ecf20Sopenharmony_ci ind * MTHCA_UD_HEADER_SIZE); 15568c2ecf20Sopenharmony_ci 15578c2ecf20Sopenharmony_ci data->byte_count = cpu_to_be32(header_size); 15588c2ecf20Sopenharmony_ci data->lkey = cpu_to_be32(to_mpd(qp->ibqp.pd)->ntmr.ibmr.lkey); 15598c2ecf20Sopenharmony_ci data->addr = cpu_to_be64(sqp->header_dma + 15608c2ecf20Sopenharmony_ci ind * MTHCA_UD_HEADER_SIZE); 15618c2ecf20Sopenharmony_ci 15628c2ecf20Sopenharmony_ci return 0; 15638c2ecf20Sopenharmony_ci} 15648c2ecf20Sopenharmony_ci 15658c2ecf20Sopenharmony_cistatic inline int mthca_wq_overflow(struct mthca_wq *wq, int nreq, 15668c2ecf20Sopenharmony_ci struct ib_cq *ib_cq) 15678c2ecf20Sopenharmony_ci{ 15688c2ecf20Sopenharmony_ci unsigned cur; 15698c2ecf20Sopenharmony_ci struct mthca_cq *cq; 15708c2ecf20Sopenharmony_ci 15718c2ecf20Sopenharmony_ci cur = wq->head - wq->tail; 15728c2ecf20Sopenharmony_ci if (likely(cur + nreq < wq->max)) 15738c2ecf20Sopenharmony_ci return 0; 15748c2ecf20Sopenharmony_ci 15758c2ecf20Sopenharmony_ci cq = to_mcq(ib_cq); 15768c2ecf20Sopenharmony_ci spin_lock(&cq->lock); 15778c2ecf20Sopenharmony_ci cur = wq->head - wq->tail; 15788c2ecf20Sopenharmony_ci spin_unlock(&cq->lock); 15798c2ecf20Sopenharmony_ci 15808c2ecf20Sopenharmony_ci return cur + nreq >= wq->max; 15818c2ecf20Sopenharmony_ci} 15828c2ecf20Sopenharmony_ci 15838c2ecf20Sopenharmony_cistatic __always_inline void set_raddr_seg(struct mthca_raddr_seg *rseg, 15848c2ecf20Sopenharmony_ci u64 remote_addr, u32 rkey) 15858c2ecf20Sopenharmony_ci{ 15868c2ecf20Sopenharmony_ci rseg->raddr = cpu_to_be64(remote_addr); 15878c2ecf20Sopenharmony_ci rseg->rkey = cpu_to_be32(rkey); 15888c2ecf20Sopenharmony_ci rseg->reserved = 0; 15898c2ecf20Sopenharmony_ci} 15908c2ecf20Sopenharmony_ci 15918c2ecf20Sopenharmony_cistatic __always_inline void set_atomic_seg(struct mthca_atomic_seg *aseg, 15928c2ecf20Sopenharmony_ci const struct ib_atomic_wr *wr) 15938c2ecf20Sopenharmony_ci{ 15948c2ecf20Sopenharmony_ci if (wr->wr.opcode == IB_WR_ATOMIC_CMP_AND_SWP) { 15958c2ecf20Sopenharmony_ci aseg->swap_add = cpu_to_be64(wr->swap); 15968c2ecf20Sopenharmony_ci aseg->compare = cpu_to_be64(wr->compare_add); 15978c2ecf20Sopenharmony_ci } else { 15988c2ecf20Sopenharmony_ci aseg->swap_add = cpu_to_be64(wr->compare_add); 15998c2ecf20Sopenharmony_ci aseg->compare = 0; 16008c2ecf20Sopenharmony_ci } 16018c2ecf20Sopenharmony_ci 16028c2ecf20Sopenharmony_ci} 16038c2ecf20Sopenharmony_ci 16048c2ecf20Sopenharmony_cistatic void set_tavor_ud_seg(struct mthca_tavor_ud_seg *useg, 16058c2ecf20Sopenharmony_ci const struct ib_ud_wr *wr) 16068c2ecf20Sopenharmony_ci{ 16078c2ecf20Sopenharmony_ci useg->lkey = cpu_to_be32(to_mah(wr->ah)->key); 16088c2ecf20Sopenharmony_ci useg->av_addr = cpu_to_be64(to_mah(wr->ah)->avdma); 16098c2ecf20Sopenharmony_ci useg->dqpn = cpu_to_be32(wr->remote_qpn); 16108c2ecf20Sopenharmony_ci useg->qkey = cpu_to_be32(wr->remote_qkey); 16118c2ecf20Sopenharmony_ci 16128c2ecf20Sopenharmony_ci} 16138c2ecf20Sopenharmony_ci 16148c2ecf20Sopenharmony_cistatic void set_arbel_ud_seg(struct mthca_arbel_ud_seg *useg, 16158c2ecf20Sopenharmony_ci const struct ib_ud_wr *wr) 16168c2ecf20Sopenharmony_ci{ 16178c2ecf20Sopenharmony_ci memcpy(useg->av, to_mah(wr->ah)->av, MTHCA_AV_SIZE); 16188c2ecf20Sopenharmony_ci useg->dqpn = cpu_to_be32(wr->remote_qpn); 16198c2ecf20Sopenharmony_ci useg->qkey = cpu_to_be32(wr->remote_qkey); 16208c2ecf20Sopenharmony_ci} 16218c2ecf20Sopenharmony_ci 16228c2ecf20Sopenharmony_ciint mthca_tavor_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr, 16238c2ecf20Sopenharmony_ci const struct ib_send_wr **bad_wr) 16248c2ecf20Sopenharmony_ci{ 16258c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 16268c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 16278c2ecf20Sopenharmony_ci void *wqe; 16288c2ecf20Sopenharmony_ci void *prev_wqe; 16298c2ecf20Sopenharmony_ci unsigned long flags; 16308c2ecf20Sopenharmony_ci int err = 0; 16318c2ecf20Sopenharmony_ci int nreq; 16328c2ecf20Sopenharmony_ci int i; 16338c2ecf20Sopenharmony_ci int size; 16348c2ecf20Sopenharmony_ci /* 16358c2ecf20Sopenharmony_ci * f0 and size0 are only used if nreq != 0, and they will 16368c2ecf20Sopenharmony_ci * always be initialized the first time through the main loop 16378c2ecf20Sopenharmony_ci * before nreq is incremented. So nreq cannot become non-zero 16388c2ecf20Sopenharmony_ci * without initializing f0 and size0, and they are in fact 16398c2ecf20Sopenharmony_ci * never used uninitialized. 16408c2ecf20Sopenharmony_ci */ 16418c2ecf20Sopenharmony_ci int size0; 16428c2ecf20Sopenharmony_ci u32 f0; 16438c2ecf20Sopenharmony_ci int ind; 16448c2ecf20Sopenharmony_ci u8 op0 = 0; 16458c2ecf20Sopenharmony_ci 16468c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->sq.lock, flags); 16478c2ecf20Sopenharmony_ci 16488c2ecf20Sopenharmony_ci /* XXX check that state is OK to post send */ 16498c2ecf20Sopenharmony_ci 16508c2ecf20Sopenharmony_ci ind = qp->sq.next_ind; 16518c2ecf20Sopenharmony_ci 16528c2ecf20Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 16538c2ecf20Sopenharmony_ci if (mthca_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)) { 16548c2ecf20Sopenharmony_ci mthca_err(dev, "SQ %06x full (%u head, %u tail," 16558c2ecf20Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 16568c2ecf20Sopenharmony_ci qp->sq.head, qp->sq.tail, 16578c2ecf20Sopenharmony_ci qp->sq.max, nreq); 16588c2ecf20Sopenharmony_ci err = -ENOMEM; 16598c2ecf20Sopenharmony_ci *bad_wr = wr; 16608c2ecf20Sopenharmony_ci goto out; 16618c2ecf20Sopenharmony_ci } 16628c2ecf20Sopenharmony_ci 16638c2ecf20Sopenharmony_ci wqe = get_send_wqe(qp, ind); 16648c2ecf20Sopenharmony_ci prev_wqe = qp->sq.last; 16658c2ecf20Sopenharmony_ci qp->sq.last = wqe; 16668c2ecf20Sopenharmony_ci 16678c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->nda_op = 0; 16688c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->ee_nds = 0; 16698c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 16708c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_SIGNALED) ? 16718c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_CQ_UPDATE) : 0) | 16728c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_SOLICITED) ? 16738c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_SOLICIT) : 0) | 16748c2ecf20Sopenharmony_ci cpu_to_be32(1); 16758c2ecf20Sopenharmony_ci if (wr->opcode == IB_WR_SEND_WITH_IMM || 16768c2ecf20Sopenharmony_ci wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) 16778c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->imm = wr->ex.imm_data; 16788c2ecf20Sopenharmony_ci 16798c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 16808c2ecf20Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 16818c2ecf20Sopenharmony_ci 16828c2ecf20Sopenharmony_ci switch (qp->transport) { 16838c2ecf20Sopenharmony_ci case RC: 16848c2ecf20Sopenharmony_ci switch (wr->opcode) { 16858c2ecf20Sopenharmony_ci case IB_WR_ATOMIC_CMP_AND_SWP: 16868c2ecf20Sopenharmony_ci case IB_WR_ATOMIC_FETCH_AND_ADD: 16878c2ecf20Sopenharmony_ci set_raddr_seg(wqe, atomic_wr(wr)->remote_addr, 16888c2ecf20Sopenharmony_ci atomic_wr(wr)->rkey); 16898c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 16908c2ecf20Sopenharmony_ci 16918c2ecf20Sopenharmony_ci set_atomic_seg(wqe, atomic_wr(wr)); 16928c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_atomic_seg); 16938c2ecf20Sopenharmony_ci size += (sizeof (struct mthca_raddr_seg) + 16948c2ecf20Sopenharmony_ci sizeof (struct mthca_atomic_seg)) / 16; 16958c2ecf20Sopenharmony_ci break; 16968c2ecf20Sopenharmony_ci 16978c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 16988c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 16998c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ: 17008c2ecf20Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 17018c2ecf20Sopenharmony_ci rdma_wr(wr)->rkey); 17028c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 17038c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 17048c2ecf20Sopenharmony_ci break; 17058c2ecf20Sopenharmony_ci 17068c2ecf20Sopenharmony_ci default: 17078c2ecf20Sopenharmony_ci /* No extra segments required for sends */ 17088c2ecf20Sopenharmony_ci break; 17098c2ecf20Sopenharmony_ci } 17108c2ecf20Sopenharmony_ci 17118c2ecf20Sopenharmony_ci break; 17128c2ecf20Sopenharmony_ci 17138c2ecf20Sopenharmony_ci case UC: 17148c2ecf20Sopenharmony_ci switch (wr->opcode) { 17158c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 17168c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 17178c2ecf20Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 17188c2ecf20Sopenharmony_ci rdma_wr(wr)->rkey); 17198c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 17208c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 17218c2ecf20Sopenharmony_ci break; 17228c2ecf20Sopenharmony_ci 17238c2ecf20Sopenharmony_ci default: 17248c2ecf20Sopenharmony_ci /* No extra segments required for sends */ 17258c2ecf20Sopenharmony_ci break; 17268c2ecf20Sopenharmony_ci } 17278c2ecf20Sopenharmony_ci 17288c2ecf20Sopenharmony_ci break; 17298c2ecf20Sopenharmony_ci 17308c2ecf20Sopenharmony_ci case UD: 17318c2ecf20Sopenharmony_ci set_tavor_ud_seg(wqe, ud_wr(wr)); 17328c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_tavor_ud_seg); 17338c2ecf20Sopenharmony_ci size += sizeof (struct mthca_tavor_ud_seg) / 16; 17348c2ecf20Sopenharmony_ci break; 17358c2ecf20Sopenharmony_ci 17368c2ecf20Sopenharmony_ci case MLX: 17378c2ecf20Sopenharmony_ci err = build_mlx_header( 17388c2ecf20Sopenharmony_ci dev, qp, ind, ud_wr(wr), 17398c2ecf20Sopenharmony_ci wqe - sizeof(struct mthca_next_seg), wqe); 17408c2ecf20Sopenharmony_ci if (err) { 17418c2ecf20Sopenharmony_ci *bad_wr = wr; 17428c2ecf20Sopenharmony_ci goto out; 17438c2ecf20Sopenharmony_ci } 17448c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 17458c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 17468c2ecf20Sopenharmony_ci break; 17478c2ecf20Sopenharmony_ci } 17488c2ecf20Sopenharmony_ci 17498c2ecf20Sopenharmony_ci if (wr->num_sge > qp->sq.max_gs) { 17508c2ecf20Sopenharmony_ci mthca_err(dev, "too many gathers\n"); 17518c2ecf20Sopenharmony_ci err = -EINVAL; 17528c2ecf20Sopenharmony_ci *bad_wr = wr; 17538c2ecf20Sopenharmony_ci goto out; 17548c2ecf20Sopenharmony_ci } 17558c2ecf20Sopenharmony_ci 17568c2ecf20Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 17578c2ecf20Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 17588c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 17598c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 17608c2ecf20Sopenharmony_ci } 17618c2ecf20Sopenharmony_ci 17628c2ecf20Sopenharmony_ci /* Add one more inline data segment for ICRC */ 17638c2ecf20Sopenharmony_ci if (qp->transport == MLX) { 17648c2ecf20Sopenharmony_ci ((struct mthca_data_seg *) wqe)->byte_count = 17658c2ecf20Sopenharmony_ci cpu_to_be32((1 << 31) | 4); 17668c2ecf20Sopenharmony_ci ((u32 *) wqe)[1] = 0; 17678c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 17688c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 17698c2ecf20Sopenharmony_ci } 17708c2ecf20Sopenharmony_ci 17718c2ecf20Sopenharmony_ci qp->wrid[ind + qp->rq.max] = wr->wr_id; 17728c2ecf20Sopenharmony_ci 17738c2ecf20Sopenharmony_ci if (wr->opcode >= ARRAY_SIZE(mthca_opcode)) { 17748c2ecf20Sopenharmony_ci mthca_err(dev, "opcode invalid\n"); 17758c2ecf20Sopenharmony_ci err = -EINVAL; 17768c2ecf20Sopenharmony_ci *bad_wr = wr; 17778c2ecf20Sopenharmony_ci goto out; 17788c2ecf20Sopenharmony_ci } 17798c2ecf20Sopenharmony_ci 17808c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->nda_op = 17818c2ecf20Sopenharmony_ci cpu_to_be32(((ind << qp->sq.wqe_shift) + 17828c2ecf20Sopenharmony_ci qp->send_wqe_offset) | 17838c2ecf20Sopenharmony_ci mthca_opcode[wr->opcode]); 17848c2ecf20Sopenharmony_ci wmb(); 17858c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 17868c2ecf20Sopenharmony_ci cpu_to_be32((nreq ? 0 : MTHCA_NEXT_DBD) | size | 17878c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_FENCE) ? 17888c2ecf20Sopenharmony_ci MTHCA_NEXT_FENCE : 0)); 17898c2ecf20Sopenharmony_ci 17908c2ecf20Sopenharmony_ci if (!nreq) { 17918c2ecf20Sopenharmony_ci size0 = size; 17928c2ecf20Sopenharmony_ci op0 = mthca_opcode[wr->opcode]; 17938c2ecf20Sopenharmony_ci f0 = wr->send_flags & IB_SEND_FENCE ? 17948c2ecf20Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE : 0; 17958c2ecf20Sopenharmony_ci } 17968c2ecf20Sopenharmony_ci 17978c2ecf20Sopenharmony_ci ++ind; 17988c2ecf20Sopenharmony_ci if (unlikely(ind >= qp->sq.max)) 17998c2ecf20Sopenharmony_ci ind -= qp->sq.max; 18008c2ecf20Sopenharmony_ci } 18018c2ecf20Sopenharmony_ci 18028c2ecf20Sopenharmony_ciout: 18038c2ecf20Sopenharmony_ci if (likely(nreq)) { 18048c2ecf20Sopenharmony_ci wmb(); 18058c2ecf20Sopenharmony_ci 18068c2ecf20Sopenharmony_ci mthca_write64(((qp->sq.next_ind << qp->sq.wqe_shift) + 18078c2ecf20Sopenharmony_ci qp->send_wqe_offset) | f0 | op0, 18088c2ecf20Sopenharmony_ci (qp->qpn << 8) | size0, 18098c2ecf20Sopenharmony_ci dev->kar + MTHCA_SEND_DOORBELL, 18108c2ecf20Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 18118c2ecf20Sopenharmony_ci } 18128c2ecf20Sopenharmony_ci 18138c2ecf20Sopenharmony_ci qp->sq.next_ind = ind; 18148c2ecf20Sopenharmony_ci qp->sq.head += nreq; 18158c2ecf20Sopenharmony_ci 18168c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->sq.lock, flags); 18178c2ecf20Sopenharmony_ci return err; 18188c2ecf20Sopenharmony_ci} 18198c2ecf20Sopenharmony_ci 18208c2ecf20Sopenharmony_ciint mthca_tavor_post_receive(struct ib_qp *ibqp, const struct ib_recv_wr *wr, 18218c2ecf20Sopenharmony_ci const struct ib_recv_wr **bad_wr) 18228c2ecf20Sopenharmony_ci{ 18238c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 18248c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 18258c2ecf20Sopenharmony_ci unsigned long flags; 18268c2ecf20Sopenharmony_ci int err = 0; 18278c2ecf20Sopenharmony_ci int nreq; 18288c2ecf20Sopenharmony_ci int i; 18298c2ecf20Sopenharmony_ci int size; 18308c2ecf20Sopenharmony_ci /* 18318c2ecf20Sopenharmony_ci * size0 is only used if nreq != 0, and it will always be 18328c2ecf20Sopenharmony_ci * initialized the first time through the main loop before 18338c2ecf20Sopenharmony_ci * nreq is incremented. So nreq cannot become non-zero 18348c2ecf20Sopenharmony_ci * without initializing size0, and it is in fact never used 18358c2ecf20Sopenharmony_ci * uninitialized. 18368c2ecf20Sopenharmony_ci */ 18378c2ecf20Sopenharmony_ci int size0; 18388c2ecf20Sopenharmony_ci int ind; 18398c2ecf20Sopenharmony_ci void *wqe; 18408c2ecf20Sopenharmony_ci void *prev_wqe; 18418c2ecf20Sopenharmony_ci 18428c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->rq.lock, flags); 18438c2ecf20Sopenharmony_ci 18448c2ecf20Sopenharmony_ci /* XXX check that state is OK to post receive */ 18458c2ecf20Sopenharmony_ci 18468c2ecf20Sopenharmony_ci ind = qp->rq.next_ind; 18478c2ecf20Sopenharmony_ci 18488c2ecf20Sopenharmony_ci for (nreq = 0; wr; wr = wr->next) { 18498c2ecf20Sopenharmony_ci if (mthca_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) { 18508c2ecf20Sopenharmony_ci mthca_err(dev, "RQ %06x full (%u head, %u tail," 18518c2ecf20Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 18528c2ecf20Sopenharmony_ci qp->rq.head, qp->rq.tail, 18538c2ecf20Sopenharmony_ci qp->rq.max, nreq); 18548c2ecf20Sopenharmony_ci err = -ENOMEM; 18558c2ecf20Sopenharmony_ci *bad_wr = wr; 18568c2ecf20Sopenharmony_ci goto out; 18578c2ecf20Sopenharmony_ci } 18588c2ecf20Sopenharmony_ci 18598c2ecf20Sopenharmony_ci wqe = get_recv_wqe(qp, ind); 18608c2ecf20Sopenharmony_ci prev_wqe = qp->rq.last; 18618c2ecf20Sopenharmony_ci qp->rq.last = wqe; 18628c2ecf20Sopenharmony_ci 18638c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->ee_nds = 18648c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD); 18658c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 0; 18668c2ecf20Sopenharmony_ci 18678c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 18688c2ecf20Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 18698c2ecf20Sopenharmony_ci 18708c2ecf20Sopenharmony_ci if (unlikely(wr->num_sge > qp->rq.max_gs)) { 18718c2ecf20Sopenharmony_ci err = -EINVAL; 18728c2ecf20Sopenharmony_ci *bad_wr = wr; 18738c2ecf20Sopenharmony_ci goto out; 18748c2ecf20Sopenharmony_ci } 18758c2ecf20Sopenharmony_ci 18768c2ecf20Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 18778c2ecf20Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 18788c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 18798c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 18808c2ecf20Sopenharmony_ci } 18818c2ecf20Sopenharmony_ci 18828c2ecf20Sopenharmony_ci qp->wrid[ind] = wr->wr_id; 18838c2ecf20Sopenharmony_ci 18848c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 18858c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD | size); 18868c2ecf20Sopenharmony_ci 18878c2ecf20Sopenharmony_ci if (!nreq) 18888c2ecf20Sopenharmony_ci size0 = size; 18898c2ecf20Sopenharmony_ci 18908c2ecf20Sopenharmony_ci ++ind; 18918c2ecf20Sopenharmony_ci if (unlikely(ind >= qp->rq.max)) 18928c2ecf20Sopenharmony_ci ind -= qp->rq.max; 18938c2ecf20Sopenharmony_ci 18948c2ecf20Sopenharmony_ci ++nreq; 18958c2ecf20Sopenharmony_ci if (unlikely(nreq == MTHCA_TAVOR_MAX_WQES_PER_RECV_DB)) { 18968c2ecf20Sopenharmony_ci nreq = 0; 18978c2ecf20Sopenharmony_ci 18988c2ecf20Sopenharmony_ci wmb(); 18998c2ecf20Sopenharmony_ci 19008c2ecf20Sopenharmony_ci mthca_write64((qp->rq.next_ind << qp->rq.wqe_shift) | size0, 19018c2ecf20Sopenharmony_ci qp->qpn << 8, dev->kar + MTHCA_RECEIVE_DOORBELL, 19028c2ecf20Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 19038c2ecf20Sopenharmony_ci 19048c2ecf20Sopenharmony_ci qp->rq.next_ind = ind; 19058c2ecf20Sopenharmony_ci qp->rq.head += MTHCA_TAVOR_MAX_WQES_PER_RECV_DB; 19068c2ecf20Sopenharmony_ci } 19078c2ecf20Sopenharmony_ci } 19088c2ecf20Sopenharmony_ci 19098c2ecf20Sopenharmony_ciout: 19108c2ecf20Sopenharmony_ci if (likely(nreq)) { 19118c2ecf20Sopenharmony_ci wmb(); 19128c2ecf20Sopenharmony_ci 19138c2ecf20Sopenharmony_ci mthca_write64((qp->rq.next_ind << qp->rq.wqe_shift) | size0, 19148c2ecf20Sopenharmony_ci qp->qpn << 8 | nreq, dev->kar + MTHCA_RECEIVE_DOORBELL, 19158c2ecf20Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 19168c2ecf20Sopenharmony_ci } 19178c2ecf20Sopenharmony_ci 19188c2ecf20Sopenharmony_ci qp->rq.next_ind = ind; 19198c2ecf20Sopenharmony_ci qp->rq.head += nreq; 19208c2ecf20Sopenharmony_ci 19218c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->rq.lock, flags); 19228c2ecf20Sopenharmony_ci return err; 19238c2ecf20Sopenharmony_ci} 19248c2ecf20Sopenharmony_ci 19258c2ecf20Sopenharmony_ciint mthca_arbel_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr, 19268c2ecf20Sopenharmony_ci const struct ib_send_wr **bad_wr) 19278c2ecf20Sopenharmony_ci{ 19288c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 19298c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 19308c2ecf20Sopenharmony_ci u32 dbhi; 19318c2ecf20Sopenharmony_ci void *wqe; 19328c2ecf20Sopenharmony_ci void *prev_wqe; 19338c2ecf20Sopenharmony_ci unsigned long flags; 19348c2ecf20Sopenharmony_ci int err = 0; 19358c2ecf20Sopenharmony_ci int nreq; 19368c2ecf20Sopenharmony_ci int i; 19378c2ecf20Sopenharmony_ci int size; 19388c2ecf20Sopenharmony_ci /* 19398c2ecf20Sopenharmony_ci * f0 and size0 are only used if nreq != 0, and they will 19408c2ecf20Sopenharmony_ci * always be initialized the first time through the main loop 19418c2ecf20Sopenharmony_ci * before nreq is incremented. So nreq cannot become non-zero 19428c2ecf20Sopenharmony_ci * without initializing f0 and size0, and they are in fact 19438c2ecf20Sopenharmony_ci * never used uninitialized. 19448c2ecf20Sopenharmony_ci */ 19458c2ecf20Sopenharmony_ci int size0; 19468c2ecf20Sopenharmony_ci u32 f0; 19478c2ecf20Sopenharmony_ci int ind; 19488c2ecf20Sopenharmony_ci u8 op0 = 0; 19498c2ecf20Sopenharmony_ci 19508c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->sq.lock, flags); 19518c2ecf20Sopenharmony_ci 19528c2ecf20Sopenharmony_ci /* XXX check that state is OK to post send */ 19538c2ecf20Sopenharmony_ci 19548c2ecf20Sopenharmony_ci ind = qp->sq.head & (qp->sq.max - 1); 19558c2ecf20Sopenharmony_ci 19568c2ecf20Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 19578c2ecf20Sopenharmony_ci if (unlikely(nreq == MTHCA_ARBEL_MAX_WQES_PER_SEND_DB)) { 19588c2ecf20Sopenharmony_ci nreq = 0; 19598c2ecf20Sopenharmony_ci 19608c2ecf20Sopenharmony_ci dbhi = (MTHCA_ARBEL_MAX_WQES_PER_SEND_DB << 24) | 19618c2ecf20Sopenharmony_ci ((qp->sq.head & 0xffff) << 8) | f0 | op0; 19628c2ecf20Sopenharmony_ci 19638c2ecf20Sopenharmony_ci qp->sq.head += MTHCA_ARBEL_MAX_WQES_PER_SEND_DB; 19648c2ecf20Sopenharmony_ci 19658c2ecf20Sopenharmony_ci /* 19668c2ecf20Sopenharmony_ci * Make sure that descriptors are written before 19678c2ecf20Sopenharmony_ci * doorbell record. 19688c2ecf20Sopenharmony_ci */ 19698c2ecf20Sopenharmony_ci wmb(); 19708c2ecf20Sopenharmony_ci *qp->sq.db = cpu_to_be32(qp->sq.head & 0xffff); 19718c2ecf20Sopenharmony_ci 19728c2ecf20Sopenharmony_ci /* 19738c2ecf20Sopenharmony_ci * Make sure doorbell record is written before we 19748c2ecf20Sopenharmony_ci * write MMIO send doorbell. 19758c2ecf20Sopenharmony_ci */ 19768c2ecf20Sopenharmony_ci wmb(); 19778c2ecf20Sopenharmony_ci 19788c2ecf20Sopenharmony_ci mthca_write64(dbhi, (qp->qpn << 8) | size0, 19798c2ecf20Sopenharmony_ci dev->kar + MTHCA_SEND_DOORBELL, 19808c2ecf20Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 19818c2ecf20Sopenharmony_ci } 19828c2ecf20Sopenharmony_ci 19838c2ecf20Sopenharmony_ci if (mthca_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)) { 19848c2ecf20Sopenharmony_ci mthca_err(dev, "SQ %06x full (%u head, %u tail," 19858c2ecf20Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 19868c2ecf20Sopenharmony_ci qp->sq.head, qp->sq.tail, 19878c2ecf20Sopenharmony_ci qp->sq.max, nreq); 19888c2ecf20Sopenharmony_ci err = -ENOMEM; 19898c2ecf20Sopenharmony_ci *bad_wr = wr; 19908c2ecf20Sopenharmony_ci goto out; 19918c2ecf20Sopenharmony_ci } 19928c2ecf20Sopenharmony_ci 19938c2ecf20Sopenharmony_ci wqe = get_send_wqe(qp, ind); 19948c2ecf20Sopenharmony_ci prev_wqe = qp->sq.last; 19958c2ecf20Sopenharmony_ci qp->sq.last = wqe; 19968c2ecf20Sopenharmony_ci 19978c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 19988c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_SIGNALED) ? 19998c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_CQ_UPDATE) : 0) | 20008c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_SOLICITED) ? 20018c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_SOLICIT) : 0) | 20028c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_IP_CSUM) ? 20038c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_IP_CSUM | MTHCA_NEXT_TCP_UDP_CSUM) : 0) | 20048c2ecf20Sopenharmony_ci cpu_to_be32(1); 20058c2ecf20Sopenharmony_ci if (wr->opcode == IB_WR_SEND_WITH_IMM || 20068c2ecf20Sopenharmony_ci wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) 20078c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->imm = wr->ex.imm_data; 20088c2ecf20Sopenharmony_ci 20098c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 20108c2ecf20Sopenharmony_ci size = sizeof (struct mthca_next_seg) / 16; 20118c2ecf20Sopenharmony_ci 20128c2ecf20Sopenharmony_ci switch (qp->transport) { 20138c2ecf20Sopenharmony_ci case RC: 20148c2ecf20Sopenharmony_ci switch (wr->opcode) { 20158c2ecf20Sopenharmony_ci case IB_WR_ATOMIC_CMP_AND_SWP: 20168c2ecf20Sopenharmony_ci case IB_WR_ATOMIC_FETCH_AND_ADD: 20178c2ecf20Sopenharmony_ci set_raddr_seg(wqe, atomic_wr(wr)->remote_addr, 20188c2ecf20Sopenharmony_ci atomic_wr(wr)->rkey); 20198c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 20208c2ecf20Sopenharmony_ci 20218c2ecf20Sopenharmony_ci set_atomic_seg(wqe, atomic_wr(wr)); 20228c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_atomic_seg); 20238c2ecf20Sopenharmony_ci size += (sizeof (struct mthca_raddr_seg) + 20248c2ecf20Sopenharmony_ci sizeof (struct mthca_atomic_seg)) / 16; 20258c2ecf20Sopenharmony_ci break; 20268c2ecf20Sopenharmony_ci 20278c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ: 20288c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 20298c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 20308c2ecf20Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 20318c2ecf20Sopenharmony_ci rdma_wr(wr)->rkey); 20328c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 20338c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 20348c2ecf20Sopenharmony_ci break; 20358c2ecf20Sopenharmony_ci 20368c2ecf20Sopenharmony_ci default: 20378c2ecf20Sopenharmony_ci /* No extra segments required for sends */ 20388c2ecf20Sopenharmony_ci break; 20398c2ecf20Sopenharmony_ci } 20408c2ecf20Sopenharmony_ci 20418c2ecf20Sopenharmony_ci break; 20428c2ecf20Sopenharmony_ci 20438c2ecf20Sopenharmony_ci case UC: 20448c2ecf20Sopenharmony_ci switch (wr->opcode) { 20458c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 20468c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE_WITH_IMM: 20478c2ecf20Sopenharmony_ci set_raddr_seg(wqe, rdma_wr(wr)->remote_addr, 20488c2ecf20Sopenharmony_ci rdma_wr(wr)->rkey); 20498c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_raddr_seg); 20508c2ecf20Sopenharmony_ci size += sizeof (struct mthca_raddr_seg) / 16; 20518c2ecf20Sopenharmony_ci break; 20528c2ecf20Sopenharmony_ci 20538c2ecf20Sopenharmony_ci default: 20548c2ecf20Sopenharmony_ci /* No extra segments required for sends */ 20558c2ecf20Sopenharmony_ci break; 20568c2ecf20Sopenharmony_ci } 20578c2ecf20Sopenharmony_ci 20588c2ecf20Sopenharmony_ci break; 20598c2ecf20Sopenharmony_ci 20608c2ecf20Sopenharmony_ci case UD: 20618c2ecf20Sopenharmony_ci set_arbel_ud_seg(wqe, ud_wr(wr)); 20628c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_arbel_ud_seg); 20638c2ecf20Sopenharmony_ci size += sizeof (struct mthca_arbel_ud_seg) / 16; 20648c2ecf20Sopenharmony_ci break; 20658c2ecf20Sopenharmony_ci 20668c2ecf20Sopenharmony_ci case MLX: 20678c2ecf20Sopenharmony_ci err = build_mlx_header( 20688c2ecf20Sopenharmony_ci dev, qp, ind, ud_wr(wr), 20698c2ecf20Sopenharmony_ci wqe - sizeof(struct mthca_next_seg), wqe); 20708c2ecf20Sopenharmony_ci if (err) { 20718c2ecf20Sopenharmony_ci *bad_wr = wr; 20728c2ecf20Sopenharmony_ci goto out; 20738c2ecf20Sopenharmony_ci } 20748c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 20758c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 20768c2ecf20Sopenharmony_ci break; 20778c2ecf20Sopenharmony_ci } 20788c2ecf20Sopenharmony_ci 20798c2ecf20Sopenharmony_ci if (wr->num_sge > qp->sq.max_gs) { 20808c2ecf20Sopenharmony_ci mthca_err(dev, "too many gathers\n"); 20818c2ecf20Sopenharmony_ci err = -EINVAL; 20828c2ecf20Sopenharmony_ci *bad_wr = wr; 20838c2ecf20Sopenharmony_ci goto out; 20848c2ecf20Sopenharmony_ci } 20858c2ecf20Sopenharmony_ci 20868c2ecf20Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 20878c2ecf20Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 20888c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 20898c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 20908c2ecf20Sopenharmony_ci } 20918c2ecf20Sopenharmony_ci 20928c2ecf20Sopenharmony_ci /* Add one more inline data segment for ICRC */ 20938c2ecf20Sopenharmony_ci if (qp->transport == MLX) { 20948c2ecf20Sopenharmony_ci ((struct mthca_data_seg *) wqe)->byte_count = 20958c2ecf20Sopenharmony_ci cpu_to_be32((1 << 31) | 4); 20968c2ecf20Sopenharmony_ci ((u32 *) wqe)[1] = 0; 20978c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 20988c2ecf20Sopenharmony_ci size += sizeof (struct mthca_data_seg) / 16; 20998c2ecf20Sopenharmony_ci } 21008c2ecf20Sopenharmony_ci 21018c2ecf20Sopenharmony_ci qp->wrid[ind + qp->rq.max] = wr->wr_id; 21028c2ecf20Sopenharmony_ci 21038c2ecf20Sopenharmony_ci if (wr->opcode >= ARRAY_SIZE(mthca_opcode)) { 21048c2ecf20Sopenharmony_ci mthca_err(dev, "opcode invalid\n"); 21058c2ecf20Sopenharmony_ci err = -EINVAL; 21068c2ecf20Sopenharmony_ci *bad_wr = wr; 21078c2ecf20Sopenharmony_ci goto out; 21088c2ecf20Sopenharmony_ci } 21098c2ecf20Sopenharmony_ci 21108c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->nda_op = 21118c2ecf20Sopenharmony_ci cpu_to_be32(((ind << qp->sq.wqe_shift) + 21128c2ecf20Sopenharmony_ci qp->send_wqe_offset) | 21138c2ecf20Sopenharmony_ci mthca_opcode[wr->opcode]); 21148c2ecf20Sopenharmony_ci wmb(); 21158c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) prev_wqe)->ee_nds = 21168c2ecf20Sopenharmony_ci cpu_to_be32(MTHCA_NEXT_DBD | size | 21178c2ecf20Sopenharmony_ci ((wr->send_flags & IB_SEND_FENCE) ? 21188c2ecf20Sopenharmony_ci MTHCA_NEXT_FENCE : 0)); 21198c2ecf20Sopenharmony_ci 21208c2ecf20Sopenharmony_ci if (!nreq) { 21218c2ecf20Sopenharmony_ci size0 = size; 21228c2ecf20Sopenharmony_ci op0 = mthca_opcode[wr->opcode]; 21238c2ecf20Sopenharmony_ci f0 = wr->send_flags & IB_SEND_FENCE ? 21248c2ecf20Sopenharmony_ci MTHCA_SEND_DOORBELL_FENCE : 0; 21258c2ecf20Sopenharmony_ci } 21268c2ecf20Sopenharmony_ci 21278c2ecf20Sopenharmony_ci ++ind; 21288c2ecf20Sopenharmony_ci if (unlikely(ind >= qp->sq.max)) 21298c2ecf20Sopenharmony_ci ind -= qp->sq.max; 21308c2ecf20Sopenharmony_ci } 21318c2ecf20Sopenharmony_ci 21328c2ecf20Sopenharmony_ciout: 21338c2ecf20Sopenharmony_ci if (likely(nreq)) { 21348c2ecf20Sopenharmony_ci dbhi = (nreq << 24) | ((qp->sq.head & 0xffff) << 8) | f0 | op0; 21358c2ecf20Sopenharmony_ci 21368c2ecf20Sopenharmony_ci qp->sq.head += nreq; 21378c2ecf20Sopenharmony_ci 21388c2ecf20Sopenharmony_ci /* 21398c2ecf20Sopenharmony_ci * Make sure that descriptors are written before 21408c2ecf20Sopenharmony_ci * doorbell record. 21418c2ecf20Sopenharmony_ci */ 21428c2ecf20Sopenharmony_ci wmb(); 21438c2ecf20Sopenharmony_ci *qp->sq.db = cpu_to_be32(qp->sq.head & 0xffff); 21448c2ecf20Sopenharmony_ci 21458c2ecf20Sopenharmony_ci /* 21468c2ecf20Sopenharmony_ci * Make sure doorbell record is written before we 21478c2ecf20Sopenharmony_ci * write MMIO send doorbell. 21488c2ecf20Sopenharmony_ci */ 21498c2ecf20Sopenharmony_ci wmb(); 21508c2ecf20Sopenharmony_ci 21518c2ecf20Sopenharmony_ci mthca_write64(dbhi, (qp->qpn << 8) | size0, dev->kar + MTHCA_SEND_DOORBELL, 21528c2ecf20Sopenharmony_ci MTHCA_GET_DOORBELL_LOCK(&dev->doorbell_lock)); 21538c2ecf20Sopenharmony_ci } 21548c2ecf20Sopenharmony_ci 21558c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->sq.lock, flags); 21568c2ecf20Sopenharmony_ci return err; 21578c2ecf20Sopenharmony_ci} 21588c2ecf20Sopenharmony_ci 21598c2ecf20Sopenharmony_ciint mthca_arbel_post_receive(struct ib_qp *ibqp, const struct ib_recv_wr *wr, 21608c2ecf20Sopenharmony_ci const struct ib_recv_wr **bad_wr) 21618c2ecf20Sopenharmony_ci{ 21628c2ecf20Sopenharmony_ci struct mthca_dev *dev = to_mdev(ibqp->device); 21638c2ecf20Sopenharmony_ci struct mthca_qp *qp = to_mqp(ibqp); 21648c2ecf20Sopenharmony_ci unsigned long flags; 21658c2ecf20Sopenharmony_ci int err = 0; 21668c2ecf20Sopenharmony_ci int nreq; 21678c2ecf20Sopenharmony_ci int ind; 21688c2ecf20Sopenharmony_ci int i; 21698c2ecf20Sopenharmony_ci void *wqe; 21708c2ecf20Sopenharmony_ci 21718c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->rq.lock, flags); 21728c2ecf20Sopenharmony_ci 21738c2ecf20Sopenharmony_ci /* XXX check that state is OK to post receive */ 21748c2ecf20Sopenharmony_ci 21758c2ecf20Sopenharmony_ci ind = qp->rq.head & (qp->rq.max - 1); 21768c2ecf20Sopenharmony_ci 21778c2ecf20Sopenharmony_ci for (nreq = 0; wr; ++nreq, wr = wr->next) { 21788c2ecf20Sopenharmony_ci if (mthca_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) { 21798c2ecf20Sopenharmony_ci mthca_err(dev, "RQ %06x full (%u head, %u tail," 21808c2ecf20Sopenharmony_ci " %d max, %d nreq)\n", qp->qpn, 21818c2ecf20Sopenharmony_ci qp->rq.head, qp->rq.tail, 21828c2ecf20Sopenharmony_ci qp->rq.max, nreq); 21838c2ecf20Sopenharmony_ci err = -ENOMEM; 21848c2ecf20Sopenharmony_ci *bad_wr = wr; 21858c2ecf20Sopenharmony_ci goto out; 21868c2ecf20Sopenharmony_ci } 21878c2ecf20Sopenharmony_ci 21888c2ecf20Sopenharmony_ci wqe = get_recv_wqe(qp, ind); 21898c2ecf20Sopenharmony_ci 21908c2ecf20Sopenharmony_ci ((struct mthca_next_seg *) wqe)->flags = 0; 21918c2ecf20Sopenharmony_ci 21928c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_next_seg); 21938c2ecf20Sopenharmony_ci 21948c2ecf20Sopenharmony_ci if (unlikely(wr->num_sge > qp->rq.max_gs)) { 21958c2ecf20Sopenharmony_ci err = -EINVAL; 21968c2ecf20Sopenharmony_ci *bad_wr = wr; 21978c2ecf20Sopenharmony_ci goto out; 21988c2ecf20Sopenharmony_ci } 21998c2ecf20Sopenharmony_ci 22008c2ecf20Sopenharmony_ci for (i = 0; i < wr->num_sge; ++i) { 22018c2ecf20Sopenharmony_ci mthca_set_data_seg(wqe, wr->sg_list + i); 22028c2ecf20Sopenharmony_ci wqe += sizeof (struct mthca_data_seg); 22038c2ecf20Sopenharmony_ci } 22048c2ecf20Sopenharmony_ci 22058c2ecf20Sopenharmony_ci if (i < qp->rq.max_gs) 22068c2ecf20Sopenharmony_ci mthca_set_data_seg_inval(wqe); 22078c2ecf20Sopenharmony_ci 22088c2ecf20Sopenharmony_ci qp->wrid[ind] = wr->wr_id; 22098c2ecf20Sopenharmony_ci 22108c2ecf20Sopenharmony_ci ++ind; 22118c2ecf20Sopenharmony_ci if (unlikely(ind >= qp->rq.max)) 22128c2ecf20Sopenharmony_ci ind -= qp->rq.max; 22138c2ecf20Sopenharmony_ci } 22148c2ecf20Sopenharmony_ciout: 22158c2ecf20Sopenharmony_ci if (likely(nreq)) { 22168c2ecf20Sopenharmony_ci qp->rq.head += nreq; 22178c2ecf20Sopenharmony_ci 22188c2ecf20Sopenharmony_ci /* 22198c2ecf20Sopenharmony_ci * Make sure that descriptors are written before 22208c2ecf20Sopenharmony_ci * doorbell record. 22218c2ecf20Sopenharmony_ci */ 22228c2ecf20Sopenharmony_ci wmb(); 22238c2ecf20Sopenharmony_ci *qp->rq.db = cpu_to_be32(qp->rq.head & 0xffff); 22248c2ecf20Sopenharmony_ci } 22258c2ecf20Sopenharmony_ci 22268c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->rq.lock, flags); 22278c2ecf20Sopenharmony_ci return err; 22288c2ecf20Sopenharmony_ci} 22298c2ecf20Sopenharmony_ci 22308c2ecf20Sopenharmony_civoid mthca_free_err_wqe(struct mthca_dev *dev, struct mthca_qp *qp, int is_send, 22318c2ecf20Sopenharmony_ci int index, int *dbd, __be32 *new_wqe) 22328c2ecf20Sopenharmony_ci{ 22338c2ecf20Sopenharmony_ci struct mthca_next_seg *next; 22348c2ecf20Sopenharmony_ci 22358c2ecf20Sopenharmony_ci /* 22368c2ecf20Sopenharmony_ci * For SRQs, all receive WQEs generate a CQE, so we're always 22378c2ecf20Sopenharmony_ci * at the end of the doorbell chain. 22388c2ecf20Sopenharmony_ci */ 22398c2ecf20Sopenharmony_ci if (qp->ibqp.srq && !is_send) { 22408c2ecf20Sopenharmony_ci *new_wqe = 0; 22418c2ecf20Sopenharmony_ci return; 22428c2ecf20Sopenharmony_ci } 22438c2ecf20Sopenharmony_ci 22448c2ecf20Sopenharmony_ci if (is_send) 22458c2ecf20Sopenharmony_ci next = get_send_wqe(qp, index); 22468c2ecf20Sopenharmony_ci else 22478c2ecf20Sopenharmony_ci next = get_recv_wqe(qp, index); 22488c2ecf20Sopenharmony_ci 22498c2ecf20Sopenharmony_ci *dbd = !!(next->ee_nds & cpu_to_be32(MTHCA_NEXT_DBD)); 22508c2ecf20Sopenharmony_ci if (next->ee_nds & cpu_to_be32(0x3f)) 22518c2ecf20Sopenharmony_ci *new_wqe = (next->nda_op & cpu_to_be32(~0x3f)) | 22528c2ecf20Sopenharmony_ci (next->ee_nds & cpu_to_be32(0x3f)); 22538c2ecf20Sopenharmony_ci else 22548c2ecf20Sopenharmony_ci *new_wqe = 0; 22558c2ecf20Sopenharmony_ci} 22568c2ecf20Sopenharmony_ci 22578c2ecf20Sopenharmony_ciint mthca_init_qp_table(struct mthca_dev *dev) 22588c2ecf20Sopenharmony_ci{ 22598c2ecf20Sopenharmony_ci int err; 22608c2ecf20Sopenharmony_ci int i; 22618c2ecf20Sopenharmony_ci 22628c2ecf20Sopenharmony_ci spin_lock_init(&dev->qp_table.lock); 22638c2ecf20Sopenharmony_ci 22648c2ecf20Sopenharmony_ci /* 22658c2ecf20Sopenharmony_ci * We reserve 2 extra QPs per port for the special QPs. The 22668c2ecf20Sopenharmony_ci * special QP for port 1 has to be even, so round up. 22678c2ecf20Sopenharmony_ci */ 22688c2ecf20Sopenharmony_ci dev->qp_table.sqp_start = (dev->limits.reserved_qps + 1) & ~1UL; 22698c2ecf20Sopenharmony_ci err = mthca_alloc_init(&dev->qp_table.alloc, 22708c2ecf20Sopenharmony_ci dev->limits.num_qps, 22718c2ecf20Sopenharmony_ci (1 << 24) - 1, 22728c2ecf20Sopenharmony_ci dev->qp_table.sqp_start + 22738c2ecf20Sopenharmony_ci MTHCA_MAX_PORTS * 2); 22748c2ecf20Sopenharmony_ci if (err) 22758c2ecf20Sopenharmony_ci return err; 22768c2ecf20Sopenharmony_ci 22778c2ecf20Sopenharmony_ci err = mthca_array_init(&dev->qp_table.qp, 22788c2ecf20Sopenharmony_ci dev->limits.num_qps); 22798c2ecf20Sopenharmony_ci if (err) { 22808c2ecf20Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 22818c2ecf20Sopenharmony_ci return err; 22828c2ecf20Sopenharmony_ci } 22838c2ecf20Sopenharmony_ci 22848c2ecf20Sopenharmony_ci for (i = 0; i < 2; ++i) { 22858c2ecf20Sopenharmony_ci err = mthca_CONF_SPECIAL_QP(dev, i ? IB_QPT_GSI : IB_QPT_SMI, 22868c2ecf20Sopenharmony_ci dev->qp_table.sqp_start + i * 2); 22878c2ecf20Sopenharmony_ci if (err) { 22888c2ecf20Sopenharmony_ci mthca_warn(dev, "CONF_SPECIAL_QP returned " 22898c2ecf20Sopenharmony_ci "%d, aborting.\n", err); 22908c2ecf20Sopenharmony_ci goto err_out; 22918c2ecf20Sopenharmony_ci } 22928c2ecf20Sopenharmony_ci } 22938c2ecf20Sopenharmony_ci return 0; 22948c2ecf20Sopenharmony_ci 22958c2ecf20Sopenharmony_ci err_out: 22968c2ecf20Sopenharmony_ci for (i = 0; i < 2; ++i) 22978c2ecf20Sopenharmony_ci mthca_CONF_SPECIAL_QP(dev, i, 0); 22988c2ecf20Sopenharmony_ci 22998c2ecf20Sopenharmony_ci mthca_array_cleanup(&dev->qp_table.qp, dev->limits.num_qps); 23008c2ecf20Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 23018c2ecf20Sopenharmony_ci 23028c2ecf20Sopenharmony_ci return err; 23038c2ecf20Sopenharmony_ci} 23048c2ecf20Sopenharmony_ci 23058c2ecf20Sopenharmony_civoid mthca_cleanup_qp_table(struct mthca_dev *dev) 23068c2ecf20Sopenharmony_ci{ 23078c2ecf20Sopenharmony_ci int i; 23088c2ecf20Sopenharmony_ci 23098c2ecf20Sopenharmony_ci for (i = 0; i < 2; ++i) 23108c2ecf20Sopenharmony_ci mthca_CONF_SPECIAL_QP(dev, i, 0); 23118c2ecf20Sopenharmony_ci 23128c2ecf20Sopenharmony_ci mthca_array_cleanup(&dev->qp_table.qp, dev->limits.num_qps); 23138c2ecf20Sopenharmony_ci mthca_alloc_cleanup(&dev->qp_table.alloc); 23148c2ecf20Sopenharmony_ci} 2315