18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause 28c2ecf20Sopenharmony_ci 38c2ecf20Sopenharmony_ci/* Authors: Bernard Metzler <bmt@zurich.ibm.com> */ 48c2ecf20Sopenharmony_ci/* Copyright (c) 2008-2019, IBM Corporation */ 58c2ecf20Sopenharmony_ci 68c2ecf20Sopenharmony_ci#include <linux/errno.h> 78c2ecf20Sopenharmony_ci#include <linux/types.h> 88c2ecf20Sopenharmony_ci#include <linux/uaccess.h> 98c2ecf20Sopenharmony_ci#include <linux/vmalloc.h> 108c2ecf20Sopenharmony_ci#include <linux/xarray.h> 118c2ecf20Sopenharmony_ci 128c2ecf20Sopenharmony_ci#include <rdma/iw_cm.h> 138c2ecf20Sopenharmony_ci#include <rdma/ib_verbs.h> 148c2ecf20Sopenharmony_ci#include <rdma/ib_user_verbs.h> 158c2ecf20Sopenharmony_ci#include <rdma/uverbs_ioctl.h> 168c2ecf20Sopenharmony_ci 178c2ecf20Sopenharmony_ci#include "siw.h" 188c2ecf20Sopenharmony_ci#include "siw_verbs.h" 198c2ecf20Sopenharmony_ci#include "siw_mem.h" 208c2ecf20Sopenharmony_ci 218c2ecf20Sopenharmony_cistatic int ib_qp_state_to_siw_qp_state[IB_QPS_ERR + 1] = { 228c2ecf20Sopenharmony_ci [IB_QPS_RESET] = SIW_QP_STATE_IDLE, 238c2ecf20Sopenharmony_ci [IB_QPS_INIT] = SIW_QP_STATE_IDLE, 248c2ecf20Sopenharmony_ci [IB_QPS_RTR] = SIW_QP_STATE_RTR, 258c2ecf20Sopenharmony_ci [IB_QPS_RTS] = SIW_QP_STATE_RTS, 268c2ecf20Sopenharmony_ci [IB_QPS_SQD] = SIW_QP_STATE_CLOSING, 278c2ecf20Sopenharmony_ci [IB_QPS_SQE] = SIW_QP_STATE_TERMINATE, 288c2ecf20Sopenharmony_ci [IB_QPS_ERR] = SIW_QP_STATE_ERROR 298c2ecf20Sopenharmony_ci}; 308c2ecf20Sopenharmony_ci 318c2ecf20Sopenharmony_cistatic char ib_qp_state_to_string[IB_QPS_ERR + 1][sizeof("RESET")] = { 328c2ecf20Sopenharmony_ci [IB_QPS_RESET] = "RESET", [IB_QPS_INIT] = "INIT", [IB_QPS_RTR] = "RTR", 338c2ecf20Sopenharmony_ci [IB_QPS_RTS] = "RTS", [IB_QPS_SQD] = "SQD", [IB_QPS_SQE] = "SQE", 348c2ecf20Sopenharmony_ci [IB_QPS_ERR] = "ERR" 358c2ecf20Sopenharmony_ci}; 368c2ecf20Sopenharmony_ci 378c2ecf20Sopenharmony_civoid siw_mmap_free(struct rdma_user_mmap_entry *rdma_entry) 388c2ecf20Sopenharmony_ci{ 398c2ecf20Sopenharmony_ci struct siw_user_mmap_entry *entry = to_siw_mmap_entry(rdma_entry); 408c2ecf20Sopenharmony_ci 418c2ecf20Sopenharmony_ci kfree(entry); 428c2ecf20Sopenharmony_ci} 438c2ecf20Sopenharmony_ci 448c2ecf20Sopenharmony_ciint siw_mmap(struct ib_ucontext *ctx, struct vm_area_struct *vma) 458c2ecf20Sopenharmony_ci{ 468c2ecf20Sopenharmony_ci struct siw_ucontext *uctx = to_siw_ctx(ctx); 478c2ecf20Sopenharmony_ci size_t size = vma->vm_end - vma->vm_start; 488c2ecf20Sopenharmony_ci struct rdma_user_mmap_entry *rdma_entry; 498c2ecf20Sopenharmony_ci struct siw_user_mmap_entry *entry; 508c2ecf20Sopenharmony_ci int rv = -EINVAL; 518c2ecf20Sopenharmony_ci 528c2ecf20Sopenharmony_ci /* 538c2ecf20Sopenharmony_ci * Must be page aligned 548c2ecf20Sopenharmony_ci */ 558c2ecf20Sopenharmony_ci if (vma->vm_start & (PAGE_SIZE - 1)) { 568c2ecf20Sopenharmony_ci pr_warn("siw: mmap not page aligned\n"); 578c2ecf20Sopenharmony_ci return -EINVAL; 588c2ecf20Sopenharmony_ci } 598c2ecf20Sopenharmony_ci rdma_entry = rdma_user_mmap_entry_get(&uctx->base_ucontext, vma); 608c2ecf20Sopenharmony_ci if (!rdma_entry) { 618c2ecf20Sopenharmony_ci siw_dbg(&uctx->sdev->base_dev, "mmap lookup failed: %lu, %#zx\n", 628c2ecf20Sopenharmony_ci vma->vm_pgoff, size); 638c2ecf20Sopenharmony_ci return -EINVAL; 648c2ecf20Sopenharmony_ci } 658c2ecf20Sopenharmony_ci entry = to_siw_mmap_entry(rdma_entry); 668c2ecf20Sopenharmony_ci 678c2ecf20Sopenharmony_ci rv = remap_vmalloc_range(vma, entry->address, 0); 688c2ecf20Sopenharmony_ci if (rv) { 698c2ecf20Sopenharmony_ci pr_warn("remap_vmalloc_range failed: %lu, %zu\n", vma->vm_pgoff, 708c2ecf20Sopenharmony_ci size); 718c2ecf20Sopenharmony_ci goto out; 728c2ecf20Sopenharmony_ci } 738c2ecf20Sopenharmony_ciout: 748c2ecf20Sopenharmony_ci rdma_user_mmap_entry_put(rdma_entry); 758c2ecf20Sopenharmony_ci 768c2ecf20Sopenharmony_ci return rv; 778c2ecf20Sopenharmony_ci} 788c2ecf20Sopenharmony_ci 798c2ecf20Sopenharmony_ciint siw_alloc_ucontext(struct ib_ucontext *base_ctx, struct ib_udata *udata) 808c2ecf20Sopenharmony_ci{ 818c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_ctx->device); 828c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = to_siw_ctx(base_ctx); 838c2ecf20Sopenharmony_ci struct siw_uresp_alloc_ctx uresp = {}; 848c2ecf20Sopenharmony_ci int rv; 858c2ecf20Sopenharmony_ci 868c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_ctx) > SIW_MAX_CONTEXT) { 878c2ecf20Sopenharmony_ci rv = -ENOMEM; 888c2ecf20Sopenharmony_ci goto err_out; 898c2ecf20Sopenharmony_ci } 908c2ecf20Sopenharmony_ci ctx->sdev = sdev; 918c2ecf20Sopenharmony_ci 928c2ecf20Sopenharmony_ci uresp.dev_id = sdev->vendor_part_id; 938c2ecf20Sopenharmony_ci 948c2ecf20Sopenharmony_ci if (udata->outlen < sizeof(uresp)) { 958c2ecf20Sopenharmony_ci rv = -EINVAL; 968c2ecf20Sopenharmony_ci goto err_out; 978c2ecf20Sopenharmony_ci } 988c2ecf20Sopenharmony_ci rv = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 998c2ecf20Sopenharmony_ci if (rv) 1008c2ecf20Sopenharmony_ci goto err_out; 1018c2ecf20Sopenharmony_ci 1028c2ecf20Sopenharmony_ci siw_dbg(base_ctx->device, "success. now %d context(s)\n", 1038c2ecf20Sopenharmony_ci atomic_read(&sdev->num_ctx)); 1048c2ecf20Sopenharmony_ci 1058c2ecf20Sopenharmony_ci return 0; 1068c2ecf20Sopenharmony_ci 1078c2ecf20Sopenharmony_cierr_out: 1088c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_ctx); 1098c2ecf20Sopenharmony_ci siw_dbg(base_ctx->device, "failure %d. now %d context(s)\n", rv, 1108c2ecf20Sopenharmony_ci atomic_read(&sdev->num_ctx)); 1118c2ecf20Sopenharmony_ci 1128c2ecf20Sopenharmony_ci return rv; 1138c2ecf20Sopenharmony_ci} 1148c2ecf20Sopenharmony_ci 1158c2ecf20Sopenharmony_civoid siw_dealloc_ucontext(struct ib_ucontext *base_ctx) 1168c2ecf20Sopenharmony_ci{ 1178c2ecf20Sopenharmony_ci struct siw_ucontext *uctx = to_siw_ctx(base_ctx); 1188c2ecf20Sopenharmony_ci 1198c2ecf20Sopenharmony_ci atomic_dec(&uctx->sdev->num_ctx); 1208c2ecf20Sopenharmony_ci} 1218c2ecf20Sopenharmony_ci 1228c2ecf20Sopenharmony_ciint siw_query_device(struct ib_device *base_dev, struct ib_device_attr *attr, 1238c2ecf20Sopenharmony_ci struct ib_udata *udata) 1248c2ecf20Sopenharmony_ci{ 1258c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_dev); 1268c2ecf20Sopenharmony_ci 1278c2ecf20Sopenharmony_ci if (udata->inlen || udata->outlen) 1288c2ecf20Sopenharmony_ci return -EINVAL; 1298c2ecf20Sopenharmony_ci 1308c2ecf20Sopenharmony_ci memset(attr, 0, sizeof(*attr)); 1318c2ecf20Sopenharmony_ci 1328c2ecf20Sopenharmony_ci /* Revisit atomic caps if RFC 7306 gets supported */ 1338c2ecf20Sopenharmony_ci attr->atomic_cap = 0; 1348c2ecf20Sopenharmony_ci attr->device_cap_flags = 1358c2ecf20Sopenharmony_ci IB_DEVICE_MEM_MGT_EXTENSIONS | IB_DEVICE_ALLOW_USER_UNREG; 1368c2ecf20Sopenharmony_ci attr->max_cq = sdev->attrs.max_cq; 1378c2ecf20Sopenharmony_ci attr->max_cqe = sdev->attrs.max_cqe; 1388c2ecf20Sopenharmony_ci attr->max_fast_reg_page_list_len = SIW_MAX_SGE_PBL; 1398c2ecf20Sopenharmony_ci attr->max_mr = sdev->attrs.max_mr; 1408c2ecf20Sopenharmony_ci attr->max_mw = sdev->attrs.max_mw; 1418c2ecf20Sopenharmony_ci attr->max_mr_size = ~0ull; 1428c2ecf20Sopenharmony_ci attr->max_pd = sdev->attrs.max_pd; 1438c2ecf20Sopenharmony_ci attr->max_qp = sdev->attrs.max_qp; 1448c2ecf20Sopenharmony_ci attr->max_qp_init_rd_atom = sdev->attrs.max_ird; 1458c2ecf20Sopenharmony_ci attr->max_qp_rd_atom = sdev->attrs.max_ord; 1468c2ecf20Sopenharmony_ci attr->max_qp_wr = sdev->attrs.max_qp_wr; 1478c2ecf20Sopenharmony_ci attr->max_recv_sge = sdev->attrs.max_sge; 1488c2ecf20Sopenharmony_ci attr->max_res_rd_atom = sdev->attrs.max_qp * sdev->attrs.max_ird; 1498c2ecf20Sopenharmony_ci attr->max_send_sge = sdev->attrs.max_sge; 1508c2ecf20Sopenharmony_ci attr->max_sge_rd = sdev->attrs.max_sge_rd; 1518c2ecf20Sopenharmony_ci attr->max_srq = sdev->attrs.max_srq; 1528c2ecf20Sopenharmony_ci attr->max_srq_sge = sdev->attrs.max_srq_sge; 1538c2ecf20Sopenharmony_ci attr->max_srq_wr = sdev->attrs.max_srq_wr; 1548c2ecf20Sopenharmony_ci attr->page_size_cap = PAGE_SIZE; 1558c2ecf20Sopenharmony_ci attr->vendor_id = SIW_VENDOR_ID; 1568c2ecf20Sopenharmony_ci attr->vendor_part_id = sdev->vendor_part_id; 1578c2ecf20Sopenharmony_ci 1588c2ecf20Sopenharmony_ci memcpy(&attr->sys_image_guid, sdev->netdev->dev_addr, 6); 1598c2ecf20Sopenharmony_ci 1608c2ecf20Sopenharmony_ci return 0; 1618c2ecf20Sopenharmony_ci} 1628c2ecf20Sopenharmony_ci 1638c2ecf20Sopenharmony_ciint siw_query_port(struct ib_device *base_dev, u8 port, 1648c2ecf20Sopenharmony_ci struct ib_port_attr *attr) 1658c2ecf20Sopenharmony_ci{ 1668c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_dev); 1678c2ecf20Sopenharmony_ci int rv; 1688c2ecf20Sopenharmony_ci 1698c2ecf20Sopenharmony_ci memset(attr, 0, sizeof(*attr)); 1708c2ecf20Sopenharmony_ci 1718c2ecf20Sopenharmony_ci rv = ib_get_eth_speed(base_dev, port, &attr->active_speed, 1728c2ecf20Sopenharmony_ci &attr->active_width); 1738c2ecf20Sopenharmony_ci attr->gid_tbl_len = 1; 1748c2ecf20Sopenharmony_ci attr->max_msg_sz = -1; 1758c2ecf20Sopenharmony_ci attr->max_mtu = ib_mtu_int_to_enum(sdev->netdev->mtu); 1768c2ecf20Sopenharmony_ci attr->active_mtu = ib_mtu_int_to_enum(sdev->netdev->mtu); 1778c2ecf20Sopenharmony_ci attr->phys_state = sdev->state == IB_PORT_ACTIVE ? 1788c2ecf20Sopenharmony_ci IB_PORT_PHYS_STATE_LINK_UP : IB_PORT_PHYS_STATE_DISABLED; 1798c2ecf20Sopenharmony_ci attr->port_cap_flags = IB_PORT_CM_SUP | IB_PORT_DEVICE_MGMT_SUP; 1808c2ecf20Sopenharmony_ci attr->state = sdev->state; 1818c2ecf20Sopenharmony_ci /* 1828c2ecf20Sopenharmony_ci * All zero 1838c2ecf20Sopenharmony_ci * 1848c2ecf20Sopenharmony_ci * attr->lid = 0; 1858c2ecf20Sopenharmony_ci * attr->bad_pkey_cntr = 0; 1868c2ecf20Sopenharmony_ci * attr->qkey_viol_cntr = 0; 1878c2ecf20Sopenharmony_ci * attr->sm_lid = 0; 1888c2ecf20Sopenharmony_ci * attr->lmc = 0; 1898c2ecf20Sopenharmony_ci * attr->max_vl_num = 0; 1908c2ecf20Sopenharmony_ci * attr->sm_sl = 0; 1918c2ecf20Sopenharmony_ci * attr->subnet_timeout = 0; 1928c2ecf20Sopenharmony_ci * attr->init_type_repy = 0; 1938c2ecf20Sopenharmony_ci */ 1948c2ecf20Sopenharmony_ci return rv; 1958c2ecf20Sopenharmony_ci} 1968c2ecf20Sopenharmony_ci 1978c2ecf20Sopenharmony_ciint siw_get_port_immutable(struct ib_device *base_dev, u8 port, 1988c2ecf20Sopenharmony_ci struct ib_port_immutable *port_immutable) 1998c2ecf20Sopenharmony_ci{ 2008c2ecf20Sopenharmony_ci struct ib_port_attr attr; 2018c2ecf20Sopenharmony_ci int rv = siw_query_port(base_dev, port, &attr); 2028c2ecf20Sopenharmony_ci 2038c2ecf20Sopenharmony_ci if (rv) 2048c2ecf20Sopenharmony_ci return rv; 2058c2ecf20Sopenharmony_ci 2068c2ecf20Sopenharmony_ci port_immutable->gid_tbl_len = attr.gid_tbl_len; 2078c2ecf20Sopenharmony_ci port_immutable->core_cap_flags = RDMA_CORE_PORT_IWARP; 2088c2ecf20Sopenharmony_ci 2098c2ecf20Sopenharmony_ci return 0; 2108c2ecf20Sopenharmony_ci} 2118c2ecf20Sopenharmony_ci 2128c2ecf20Sopenharmony_ciint siw_query_gid(struct ib_device *base_dev, u8 port, int idx, 2138c2ecf20Sopenharmony_ci union ib_gid *gid) 2148c2ecf20Sopenharmony_ci{ 2158c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_dev); 2168c2ecf20Sopenharmony_ci 2178c2ecf20Sopenharmony_ci /* subnet_prefix == interface_id == 0; */ 2188c2ecf20Sopenharmony_ci memset(gid, 0, sizeof(*gid)); 2198c2ecf20Sopenharmony_ci memcpy(&gid->raw[0], sdev->netdev->dev_addr, 6); 2208c2ecf20Sopenharmony_ci 2218c2ecf20Sopenharmony_ci return 0; 2228c2ecf20Sopenharmony_ci} 2238c2ecf20Sopenharmony_ci 2248c2ecf20Sopenharmony_ciint siw_alloc_pd(struct ib_pd *pd, struct ib_udata *udata) 2258c2ecf20Sopenharmony_ci{ 2268c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(pd->device); 2278c2ecf20Sopenharmony_ci 2288c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_pd) > SIW_MAX_PD) { 2298c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_pd); 2308c2ecf20Sopenharmony_ci return -ENOMEM; 2318c2ecf20Sopenharmony_ci } 2328c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "now %d PD's(s)\n", atomic_read(&sdev->num_pd)); 2338c2ecf20Sopenharmony_ci 2348c2ecf20Sopenharmony_ci return 0; 2358c2ecf20Sopenharmony_ci} 2368c2ecf20Sopenharmony_ci 2378c2ecf20Sopenharmony_ciint siw_dealloc_pd(struct ib_pd *pd, struct ib_udata *udata) 2388c2ecf20Sopenharmony_ci{ 2398c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(pd->device); 2408c2ecf20Sopenharmony_ci 2418c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "free PD\n"); 2428c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_pd); 2438c2ecf20Sopenharmony_ci return 0; 2448c2ecf20Sopenharmony_ci} 2458c2ecf20Sopenharmony_ci 2468c2ecf20Sopenharmony_civoid siw_qp_get_ref(struct ib_qp *base_qp) 2478c2ecf20Sopenharmony_ci{ 2488c2ecf20Sopenharmony_ci siw_qp_get(to_siw_qp(base_qp)); 2498c2ecf20Sopenharmony_ci} 2508c2ecf20Sopenharmony_ci 2518c2ecf20Sopenharmony_civoid siw_qp_put_ref(struct ib_qp *base_qp) 2528c2ecf20Sopenharmony_ci{ 2538c2ecf20Sopenharmony_ci siw_qp_put(to_siw_qp(base_qp)); 2548c2ecf20Sopenharmony_ci} 2558c2ecf20Sopenharmony_ci 2568c2ecf20Sopenharmony_cistatic struct rdma_user_mmap_entry * 2578c2ecf20Sopenharmony_cisiw_mmap_entry_insert(struct siw_ucontext *uctx, 2588c2ecf20Sopenharmony_ci void *address, size_t length, 2598c2ecf20Sopenharmony_ci u64 *offset) 2608c2ecf20Sopenharmony_ci{ 2618c2ecf20Sopenharmony_ci struct siw_user_mmap_entry *entry = kzalloc(sizeof(*entry), GFP_KERNEL); 2628c2ecf20Sopenharmony_ci int rv; 2638c2ecf20Sopenharmony_ci 2648c2ecf20Sopenharmony_ci *offset = SIW_INVAL_UOBJ_KEY; 2658c2ecf20Sopenharmony_ci if (!entry) 2668c2ecf20Sopenharmony_ci return NULL; 2678c2ecf20Sopenharmony_ci 2688c2ecf20Sopenharmony_ci entry->address = address; 2698c2ecf20Sopenharmony_ci 2708c2ecf20Sopenharmony_ci rv = rdma_user_mmap_entry_insert(&uctx->base_ucontext, 2718c2ecf20Sopenharmony_ci &entry->rdma_entry, 2728c2ecf20Sopenharmony_ci length); 2738c2ecf20Sopenharmony_ci if (rv) { 2748c2ecf20Sopenharmony_ci kfree(entry); 2758c2ecf20Sopenharmony_ci return NULL; 2768c2ecf20Sopenharmony_ci } 2778c2ecf20Sopenharmony_ci 2788c2ecf20Sopenharmony_ci *offset = rdma_user_mmap_get_offset(&entry->rdma_entry); 2798c2ecf20Sopenharmony_ci 2808c2ecf20Sopenharmony_ci return &entry->rdma_entry; 2818c2ecf20Sopenharmony_ci} 2828c2ecf20Sopenharmony_ci 2838c2ecf20Sopenharmony_ci/* 2848c2ecf20Sopenharmony_ci * siw_create_qp() 2858c2ecf20Sopenharmony_ci * 2868c2ecf20Sopenharmony_ci * Create QP of requested size on given device. 2878c2ecf20Sopenharmony_ci * 2888c2ecf20Sopenharmony_ci * @pd: Protection Domain 2898c2ecf20Sopenharmony_ci * @attrs: Initial QP attributes. 2908c2ecf20Sopenharmony_ci * @udata: used to provide QP ID, SQ and RQ size back to user. 2918c2ecf20Sopenharmony_ci */ 2928c2ecf20Sopenharmony_ci 2938c2ecf20Sopenharmony_cistruct ib_qp *siw_create_qp(struct ib_pd *pd, 2948c2ecf20Sopenharmony_ci struct ib_qp_init_attr *attrs, 2958c2ecf20Sopenharmony_ci struct ib_udata *udata) 2968c2ecf20Sopenharmony_ci{ 2978c2ecf20Sopenharmony_ci struct siw_qp *qp = NULL; 2988c2ecf20Sopenharmony_ci struct ib_device *base_dev = pd->device; 2998c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_dev); 3008c2ecf20Sopenharmony_ci struct siw_ucontext *uctx = 3018c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 3028c2ecf20Sopenharmony_ci base_ucontext); 3038c2ecf20Sopenharmony_ci unsigned long flags; 3048c2ecf20Sopenharmony_ci int num_sqe, num_rqe, rv = 0; 3058c2ecf20Sopenharmony_ci size_t length; 3068c2ecf20Sopenharmony_ci 3078c2ecf20Sopenharmony_ci siw_dbg(base_dev, "create new QP\n"); 3088c2ecf20Sopenharmony_ci 3098c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_qp) > SIW_MAX_QP) { 3108c2ecf20Sopenharmony_ci siw_dbg(base_dev, "too many QP's\n"); 3118c2ecf20Sopenharmony_ci rv = -ENOMEM; 3128c2ecf20Sopenharmony_ci goto err_out; 3138c2ecf20Sopenharmony_ci } 3148c2ecf20Sopenharmony_ci if (attrs->qp_type != IB_QPT_RC) { 3158c2ecf20Sopenharmony_ci siw_dbg(base_dev, "only RC QP's supported\n"); 3168c2ecf20Sopenharmony_ci rv = -EOPNOTSUPP; 3178c2ecf20Sopenharmony_ci goto err_out; 3188c2ecf20Sopenharmony_ci } 3198c2ecf20Sopenharmony_ci if ((attrs->cap.max_send_wr > SIW_MAX_QP_WR) || 3208c2ecf20Sopenharmony_ci (attrs->cap.max_recv_wr > SIW_MAX_QP_WR) || 3218c2ecf20Sopenharmony_ci (attrs->cap.max_send_sge > SIW_MAX_SGE) || 3228c2ecf20Sopenharmony_ci (attrs->cap.max_recv_sge > SIW_MAX_SGE)) { 3238c2ecf20Sopenharmony_ci siw_dbg(base_dev, "QP size error\n"); 3248c2ecf20Sopenharmony_ci rv = -EINVAL; 3258c2ecf20Sopenharmony_ci goto err_out; 3268c2ecf20Sopenharmony_ci } 3278c2ecf20Sopenharmony_ci if (attrs->cap.max_inline_data > SIW_MAX_INLINE) { 3288c2ecf20Sopenharmony_ci siw_dbg(base_dev, "max inline send: %d > %d\n", 3298c2ecf20Sopenharmony_ci attrs->cap.max_inline_data, (int)SIW_MAX_INLINE); 3308c2ecf20Sopenharmony_ci rv = -EINVAL; 3318c2ecf20Sopenharmony_ci goto err_out; 3328c2ecf20Sopenharmony_ci } 3338c2ecf20Sopenharmony_ci /* 3348c2ecf20Sopenharmony_ci * NOTE: we allow for zero element SQ and RQ WQE's SGL's 3358c2ecf20Sopenharmony_ci * but not for a QP unable to hold any WQE (SQ + RQ) 3368c2ecf20Sopenharmony_ci */ 3378c2ecf20Sopenharmony_ci if (attrs->cap.max_send_wr + attrs->cap.max_recv_wr == 0) { 3388c2ecf20Sopenharmony_ci siw_dbg(base_dev, "QP must have send or receive queue\n"); 3398c2ecf20Sopenharmony_ci rv = -EINVAL; 3408c2ecf20Sopenharmony_ci goto err_out; 3418c2ecf20Sopenharmony_ci } 3428c2ecf20Sopenharmony_ci 3438c2ecf20Sopenharmony_ci if (!attrs->send_cq || (!attrs->recv_cq && !attrs->srq)) { 3448c2ecf20Sopenharmony_ci siw_dbg(base_dev, "send CQ or receive CQ invalid\n"); 3458c2ecf20Sopenharmony_ci rv = -EINVAL; 3468c2ecf20Sopenharmony_ci goto err_out; 3478c2ecf20Sopenharmony_ci } 3488c2ecf20Sopenharmony_ci qp = kzalloc(sizeof(*qp), GFP_KERNEL); 3498c2ecf20Sopenharmony_ci if (!qp) { 3508c2ecf20Sopenharmony_ci rv = -ENOMEM; 3518c2ecf20Sopenharmony_ci goto err_out; 3528c2ecf20Sopenharmony_ci } 3538c2ecf20Sopenharmony_ci init_rwsem(&qp->state_lock); 3548c2ecf20Sopenharmony_ci spin_lock_init(&qp->sq_lock); 3558c2ecf20Sopenharmony_ci spin_lock_init(&qp->rq_lock); 3568c2ecf20Sopenharmony_ci spin_lock_init(&qp->orq_lock); 3578c2ecf20Sopenharmony_ci 3588c2ecf20Sopenharmony_ci rv = siw_qp_add(sdev, qp); 3598c2ecf20Sopenharmony_ci if (rv) 3608c2ecf20Sopenharmony_ci goto err_out; 3618c2ecf20Sopenharmony_ci 3628c2ecf20Sopenharmony_ci num_sqe = attrs->cap.max_send_wr; 3638c2ecf20Sopenharmony_ci num_rqe = attrs->cap.max_recv_wr; 3648c2ecf20Sopenharmony_ci 3658c2ecf20Sopenharmony_ci /* All queue indices are derived from modulo operations 3668c2ecf20Sopenharmony_ci * on a free running 'get' (consumer) and 'put' (producer) 3678c2ecf20Sopenharmony_ci * unsigned counter. Having queue sizes at power of two 3688c2ecf20Sopenharmony_ci * avoids handling counter wrap around. 3698c2ecf20Sopenharmony_ci */ 3708c2ecf20Sopenharmony_ci if (num_sqe) 3718c2ecf20Sopenharmony_ci num_sqe = roundup_pow_of_two(num_sqe); 3728c2ecf20Sopenharmony_ci else { 3738c2ecf20Sopenharmony_ci /* Zero sized SQ is not supported */ 3748c2ecf20Sopenharmony_ci rv = -EINVAL; 3758c2ecf20Sopenharmony_ci goto err_out_xa; 3768c2ecf20Sopenharmony_ci } 3778c2ecf20Sopenharmony_ci if (num_rqe) 3788c2ecf20Sopenharmony_ci num_rqe = roundup_pow_of_two(num_rqe); 3798c2ecf20Sopenharmony_ci 3808c2ecf20Sopenharmony_ci if (udata) 3818c2ecf20Sopenharmony_ci qp->sendq = vmalloc_user(num_sqe * sizeof(struct siw_sqe)); 3828c2ecf20Sopenharmony_ci else 3838c2ecf20Sopenharmony_ci qp->sendq = vzalloc(num_sqe * sizeof(struct siw_sqe)); 3848c2ecf20Sopenharmony_ci 3858c2ecf20Sopenharmony_ci if (qp->sendq == NULL) { 3868c2ecf20Sopenharmony_ci rv = -ENOMEM; 3878c2ecf20Sopenharmony_ci goto err_out_xa; 3888c2ecf20Sopenharmony_ci } 3898c2ecf20Sopenharmony_ci if (attrs->sq_sig_type != IB_SIGNAL_REQ_WR) { 3908c2ecf20Sopenharmony_ci if (attrs->sq_sig_type == IB_SIGNAL_ALL_WR) 3918c2ecf20Sopenharmony_ci qp->attrs.flags |= SIW_SIGNAL_ALL_WR; 3928c2ecf20Sopenharmony_ci else { 3938c2ecf20Sopenharmony_ci rv = -EINVAL; 3948c2ecf20Sopenharmony_ci goto err_out_xa; 3958c2ecf20Sopenharmony_ci } 3968c2ecf20Sopenharmony_ci } 3978c2ecf20Sopenharmony_ci qp->pd = pd; 3988c2ecf20Sopenharmony_ci qp->scq = to_siw_cq(attrs->send_cq); 3998c2ecf20Sopenharmony_ci qp->rcq = to_siw_cq(attrs->recv_cq); 4008c2ecf20Sopenharmony_ci 4018c2ecf20Sopenharmony_ci if (attrs->srq) { 4028c2ecf20Sopenharmony_ci /* 4038c2ecf20Sopenharmony_ci * SRQ support. 4048c2ecf20Sopenharmony_ci * Verbs 6.3.7: ignore RQ size, if SRQ present 4058c2ecf20Sopenharmony_ci * Verbs 6.3.5: do not check PD of SRQ against PD of QP 4068c2ecf20Sopenharmony_ci */ 4078c2ecf20Sopenharmony_ci qp->srq = to_siw_srq(attrs->srq); 4088c2ecf20Sopenharmony_ci qp->attrs.rq_size = 0; 4098c2ecf20Sopenharmony_ci siw_dbg(base_dev, "QP [%u]: SRQ attached\n", 4108c2ecf20Sopenharmony_ci qp->base_qp.qp_num); 4118c2ecf20Sopenharmony_ci } else if (num_rqe) { 4128c2ecf20Sopenharmony_ci if (udata) 4138c2ecf20Sopenharmony_ci qp->recvq = 4148c2ecf20Sopenharmony_ci vmalloc_user(num_rqe * sizeof(struct siw_rqe)); 4158c2ecf20Sopenharmony_ci else 4168c2ecf20Sopenharmony_ci qp->recvq = vzalloc(num_rqe * sizeof(struct siw_rqe)); 4178c2ecf20Sopenharmony_ci 4188c2ecf20Sopenharmony_ci if (qp->recvq == NULL) { 4198c2ecf20Sopenharmony_ci rv = -ENOMEM; 4208c2ecf20Sopenharmony_ci goto err_out_xa; 4218c2ecf20Sopenharmony_ci } 4228c2ecf20Sopenharmony_ci qp->attrs.rq_size = num_rqe; 4238c2ecf20Sopenharmony_ci } 4248c2ecf20Sopenharmony_ci qp->attrs.sq_size = num_sqe; 4258c2ecf20Sopenharmony_ci qp->attrs.sq_max_sges = attrs->cap.max_send_sge; 4268c2ecf20Sopenharmony_ci qp->attrs.rq_max_sges = attrs->cap.max_recv_sge; 4278c2ecf20Sopenharmony_ci 4288c2ecf20Sopenharmony_ci /* Make those two tunables fixed for now. */ 4298c2ecf20Sopenharmony_ci qp->tx_ctx.gso_seg_limit = 1; 4308c2ecf20Sopenharmony_ci qp->tx_ctx.zcopy_tx = zcopy_tx; 4318c2ecf20Sopenharmony_ci 4328c2ecf20Sopenharmony_ci qp->attrs.state = SIW_QP_STATE_IDLE; 4338c2ecf20Sopenharmony_ci 4348c2ecf20Sopenharmony_ci if (udata) { 4358c2ecf20Sopenharmony_ci struct siw_uresp_create_qp uresp = {}; 4368c2ecf20Sopenharmony_ci 4378c2ecf20Sopenharmony_ci uresp.num_sqe = num_sqe; 4388c2ecf20Sopenharmony_ci uresp.num_rqe = num_rqe; 4398c2ecf20Sopenharmony_ci uresp.qp_id = qp_id(qp); 4408c2ecf20Sopenharmony_ci 4418c2ecf20Sopenharmony_ci if (qp->sendq) { 4428c2ecf20Sopenharmony_ci length = num_sqe * sizeof(struct siw_sqe); 4438c2ecf20Sopenharmony_ci qp->sq_entry = 4448c2ecf20Sopenharmony_ci siw_mmap_entry_insert(uctx, qp->sendq, 4458c2ecf20Sopenharmony_ci length, &uresp.sq_key); 4468c2ecf20Sopenharmony_ci if (!qp->sq_entry) { 4478c2ecf20Sopenharmony_ci rv = -ENOMEM; 4488c2ecf20Sopenharmony_ci goto err_out_xa; 4498c2ecf20Sopenharmony_ci } 4508c2ecf20Sopenharmony_ci } 4518c2ecf20Sopenharmony_ci 4528c2ecf20Sopenharmony_ci if (qp->recvq) { 4538c2ecf20Sopenharmony_ci length = num_rqe * sizeof(struct siw_rqe); 4548c2ecf20Sopenharmony_ci qp->rq_entry = 4558c2ecf20Sopenharmony_ci siw_mmap_entry_insert(uctx, qp->recvq, 4568c2ecf20Sopenharmony_ci length, &uresp.rq_key); 4578c2ecf20Sopenharmony_ci if (!qp->rq_entry) { 4588c2ecf20Sopenharmony_ci uresp.sq_key = SIW_INVAL_UOBJ_KEY; 4598c2ecf20Sopenharmony_ci rv = -ENOMEM; 4608c2ecf20Sopenharmony_ci goto err_out_xa; 4618c2ecf20Sopenharmony_ci } 4628c2ecf20Sopenharmony_ci } 4638c2ecf20Sopenharmony_ci 4648c2ecf20Sopenharmony_ci if (udata->outlen < sizeof(uresp)) { 4658c2ecf20Sopenharmony_ci rv = -EINVAL; 4668c2ecf20Sopenharmony_ci goto err_out_xa; 4678c2ecf20Sopenharmony_ci } 4688c2ecf20Sopenharmony_ci rv = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 4698c2ecf20Sopenharmony_ci if (rv) 4708c2ecf20Sopenharmony_ci goto err_out_xa; 4718c2ecf20Sopenharmony_ci } 4728c2ecf20Sopenharmony_ci qp->tx_cpu = siw_get_tx_cpu(sdev); 4738c2ecf20Sopenharmony_ci if (qp->tx_cpu < 0) { 4748c2ecf20Sopenharmony_ci rv = -EINVAL; 4758c2ecf20Sopenharmony_ci goto err_out_xa; 4768c2ecf20Sopenharmony_ci } 4778c2ecf20Sopenharmony_ci INIT_LIST_HEAD(&qp->devq); 4788c2ecf20Sopenharmony_ci spin_lock_irqsave(&sdev->lock, flags); 4798c2ecf20Sopenharmony_ci list_add_tail(&qp->devq, &sdev->qp_list); 4808c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&sdev->lock, flags); 4818c2ecf20Sopenharmony_ci 4828c2ecf20Sopenharmony_ci return &qp->base_qp; 4838c2ecf20Sopenharmony_ci 4848c2ecf20Sopenharmony_cierr_out_xa: 4858c2ecf20Sopenharmony_ci xa_erase(&sdev->qp_xa, qp_id(qp)); 4868c2ecf20Sopenharmony_cierr_out: 4878c2ecf20Sopenharmony_ci if (qp) { 4888c2ecf20Sopenharmony_ci if (uctx) { 4898c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(qp->sq_entry); 4908c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(qp->rq_entry); 4918c2ecf20Sopenharmony_ci } 4928c2ecf20Sopenharmony_ci vfree(qp->sendq); 4938c2ecf20Sopenharmony_ci vfree(qp->recvq); 4948c2ecf20Sopenharmony_ci kfree(qp); 4958c2ecf20Sopenharmony_ci } 4968c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_qp); 4978c2ecf20Sopenharmony_ci 4988c2ecf20Sopenharmony_ci return ERR_PTR(rv); 4998c2ecf20Sopenharmony_ci} 5008c2ecf20Sopenharmony_ci 5018c2ecf20Sopenharmony_ci/* 5028c2ecf20Sopenharmony_ci * Minimum siw_query_qp() verb interface. 5038c2ecf20Sopenharmony_ci * 5048c2ecf20Sopenharmony_ci * @qp_attr_mask is not used but all available information is provided 5058c2ecf20Sopenharmony_ci */ 5068c2ecf20Sopenharmony_ciint siw_query_qp(struct ib_qp *base_qp, struct ib_qp_attr *qp_attr, 5078c2ecf20Sopenharmony_ci int qp_attr_mask, struct ib_qp_init_attr *qp_init_attr) 5088c2ecf20Sopenharmony_ci{ 5098c2ecf20Sopenharmony_ci struct siw_qp *qp; 5108c2ecf20Sopenharmony_ci struct siw_device *sdev; 5118c2ecf20Sopenharmony_ci 5128c2ecf20Sopenharmony_ci if (base_qp && qp_attr && qp_init_attr) { 5138c2ecf20Sopenharmony_ci qp = to_siw_qp(base_qp); 5148c2ecf20Sopenharmony_ci sdev = to_siw_dev(base_qp->device); 5158c2ecf20Sopenharmony_ci } else { 5168c2ecf20Sopenharmony_ci return -EINVAL; 5178c2ecf20Sopenharmony_ci } 5188c2ecf20Sopenharmony_ci qp_attr->cap.max_inline_data = SIW_MAX_INLINE; 5198c2ecf20Sopenharmony_ci qp_attr->cap.max_send_wr = qp->attrs.sq_size; 5208c2ecf20Sopenharmony_ci qp_attr->cap.max_send_sge = qp->attrs.sq_max_sges; 5218c2ecf20Sopenharmony_ci qp_attr->cap.max_recv_wr = qp->attrs.rq_size; 5228c2ecf20Sopenharmony_ci qp_attr->cap.max_recv_sge = qp->attrs.rq_max_sges; 5238c2ecf20Sopenharmony_ci qp_attr->path_mtu = ib_mtu_int_to_enum(sdev->netdev->mtu); 5248c2ecf20Sopenharmony_ci qp_attr->max_rd_atomic = qp->attrs.irq_size; 5258c2ecf20Sopenharmony_ci qp_attr->max_dest_rd_atomic = qp->attrs.orq_size; 5268c2ecf20Sopenharmony_ci 5278c2ecf20Sopenharmony_ci qp_attr->qp_access_flags = IB_ACCESS_LOCAL_WRITE | 5288c2ecf20Sopenharmony_ci IB_ACCESS_REMOTE_WRITE | 5298c2ecf20Sopenharmony_ci IB_ACCESS_REMOTE_READ; 5308c2ecf20Sopenharmony_ci 5318c2ecf20Sopenharmony_ci qp_init_attr->qp_type = base_qp->qp_type; 5328c2ecf20Sopenharmony_ci qp_init_attr->send_cq = base_qp->send_cq; 5338c2ecf20Sopenharmony_ci qp_init_attr->recv_cq = base_qp->recv_cq; 5348c2ecf20Sopenharmony_ci qp_init_attr->srq = base_qp->srq; 5358c2ecf20Sopenharmony_ci 5368c2ecf20Sopenharmony_ci qp_init_attr->cap = qp_attr->cap; 5378c2ecf20Sopenharmony_ci 5388c2ecf20Sopenharmony_ci return 0; 5398c2ecf20Sopenharmony_ci} 5408c2ecf20Sopenharmony_ci 5418c2ecf20Sopenharmony_ciint siw_verbs_modify_qp(struct ib_qp *base_qp, struct ib_qp_attr *attr, 5428c2ecf20Sopenharmony_ci int attr_mask, struct ib_udata *udata) 5438c2ecf20Sopenharmony_ci{ 5448c2ecf20Sopenharmony_ci struct siw_qp_attrs new_attrs; 5458c2ecf20Sopenharmony_ci enum siw_qp_attr_mask siw_attr_mask = 0; 5468c2ecf20Sopenharmony_ci struct siw_qp *qp = to_siw_qp(base_qp); 5478c2ecf20Sopenharmony_ci int rv = 0; 5488c2ecf20Sopenharmony_ci 5498c2ecf20Sopenharmony_ci if (!attr_mask) 5508c2ecf20Sopenharmony_ci return 0; 5518c2ecf20Sopenharmony_ci 5528c2ecf20Sopenharmony_ci memset(&new_attrs, 0, sizeof(new_attrs)); 5538c2ecf20Sopenharmony_ci 5548c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_ACCESS_FLAGS) { 5558c2ecf20Sopenharmony_ci siw_attr_mask = SIW_QP_ATTR_ACCESS_FLAGS; 5568c2ecf20Sopenharmony_ci 5578c2ecf20Sopenharmony_ci if (attr->qp_access_flags & IB_ACCESS_REMOTE_READ) 5588c2ecf20Sopenharmony_ci new_attrs.flags |= SIW_RDMA_READ_ENABLED; 5598c2ecf20Sopenharmony_ci if (attr->qp_access_flags & IB_ACCESS_REMOTE_WRITE) 5608c2ecf20Sopenharmony_ci new_attrs.flags |= SIW_RDMA_WRITE_ENABLED; 5618c2ecf20Sopenharmony_ci if (attr->qp_access_flags & IB_ACCESS_MW_BIND) 5628c2ecf20Sopenharmony_ci new_attrs.flags |= SIW_RDMA_BIND_ENABLED; 5638c2ecf20Sopenharmony_ci } 5648c2ecf20Sopenharmony_ci if (attr_mask & IB_QP_STATE) { 5658c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "desired IB QP state: %s\n", 5668c2ecf20Sopenharmony_ci ib_qp_state_to_string[attr->qp_state]); 5678c2ecf20Sopenharmony_ci 5688c2ecf20Sopenharmony_ci new_attrs.state = ib_qp_state_to_siw_qp_state[attr->qp_state]; 5698c2ecf20Sopenharmony_ci 5708c2ecf20Sopenharmony_ci if (new_attrs.state > SIW_QP_STATE_RTS) 5718c2ecf20Sopenharmony_ci qp->tx_ctx.tx_suspend = 1; 5728c2ecf20Sopenharmony_ci 5738c2ecf20Sopenharmony_ci siw_attr_mask |= SIW_QP_ATTR_STATE; 5748c2ecf20Sopenharmony_ci } 5758c2ecf20Sopenharmony_ci if (!siw_attr_mask) 5768c2ecf20Sopenharmony_ci goto out; 5778c2ecf20Sopenharmony_ci 5788c2ecf20Sopenharmony_ci down_write(&qp->state_lock); 5798c2ecf20Sopenharmony_ci 5808c2ecf20Sopenharmony_ci rv = siw_qp_modify(qp, &new_attrs, siw_attr_mask); 5818c2ecf20Sopenharmony_ci 5828c2ecf20Sopenharmony_ci up_write(&qp->state_lock); 5838c2ecf20Sopenharmony_ciout: 5848c2ecf20Sopenharmony_ci return rv; 5858c2ecf20Sopenharmony_ci} 5868c2ecf20Sopenharmony_ci 5878c2ecf20Sopenharmony_ciint siw_destroy_qp(struct ib_qp *base_qp, struct ib_udata *udata) 5888c2ecf20Sopenharmony_ci{ 5898c2ecf20Sopenharmony_ci struct siw_qp *qp = to_siw_qp(base_qp); 5908c2ecf20Sopenharmony_ci struct siw_ucontext *uctx = 5918c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 5928c2ecf20Sopenharmony_ci base_ucontext); 5938c2ecf20Sopenharmony_ci struct siw_qp_attrs qp_attrs; 5948c2ecf20Sopenharmony_ci 5958c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "state %d\n", qp->attrs.state); 5968c2ecf20Sopenharmony_ci 5978c2ecf20Sopenharmony_ci /* 5988c2ecf20Sopenharmony_ci * Mark QP as in process of destruction to prevent from 5998c2ecf20Sopenharmony_ci * any async callbacks to RDMA core 6008c2ecf20Sopenharmony_ci */ 6018c2ecf20Sopenharmony_ci qp->attrs.flags |= SIW_QP_IN_DESTROY; 6028c2ecf20Sopenharmony_ci qp->rx_stream.rx_suspend = 1; 6038c2ecf20Sopenharmony_ci 6048c2ecf20Sopenharmony_ci if (uctx) { 6058c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(qp->sq_entry); 6068c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(qp->rq_entry); 6078c2ecf20Sopenharmony_ci } 6088c2ecf20Sopenharmony_ci 6098c2ecf20Sopenharmony_ci down_write(&qp->state_lock); 6108c2ecf20Sopenharmony_ci 6118c2ecf20Sopenharmony_ci qp_attrs.state = SIW_QP_STATE_ERROR; 6128c2ecf20Sopenharmony_ci siw_qp_modify(qp, &qp_attrs, SIW_QP_ATTR_STATE); 6138c2ecf20Sopenharmony_ci 6148c2ecf20Sopenharmony_ci if (qp->cep) { 6158c2ecf20Sopenharmony_ci siw_cep_put(qp->cep); 6168c2ecf20Sopenharmony_ci qp->cep = NULL; 6178c2ecf20Sopenharmony_ci } 6188c2ecf20Sopenharmony_ci up_write(&qp->state_lock); 6198c2ecf20Sopenharmony_ci 6208c2ecf20Sopenharmony_ci kfree(qp->tx_ctx.mpa_crc_hd); 6218c2ecf20Sopenharmony_ci kfree(qp->rx_stream.mpa_crc_hd); 6228c2ecf20Sopenharmony_ci 6238c2ecf20Sopenharmony_ci qp->scq = qp->rcq = NULL; 6248c2ecf20Sopenharmony_ci 6258c2ecf20Sopenharmony_ci siw_qp_put(qp); 6268c2ecf20Sopenharmony_ci 6278c2ecf20Sopenharmony_ci return 0; 6288c2ecf20Sopenharmony_ci} 6298c2ecf20Sopenharmony_ci 6308c2ecf20Sopenharmony_ci/* 6318c2ecf20Sopenharmony_ci * siw_copy_inline_sgl() 6328c2ecf20Sopenharmony_ci * 6338c2ecf20Sopenharmony_ci * Prepare sgl of inlined data for sending. For userland callers 6348c2ecf20Sopenharmony_ci * function checks if given buffer addresses and len's are within 6358c2ecf20Sopenharmony_ci * process context bounds. 6368c2ecf20Sopenharmony_ci * Data from all provided sge's are copied together into the wqe, 6378c2ecf20Sopenharmony_ci * referenced by a single sge. 6388c2ecf20Sopenharmony_ci */ 6398c2ecf20Sopenharmony_cistatic int siw_copy_inline_sgl(const struct ib_send_wr *core_wr, 6408c2ecf20Sopenharmony_ci struct siw_sqe *sqe) 6418c2ecf20Sopenharmony_ci{ 6428c2ecf20Sopenharmony_ci struct ib_sge *core_sge = core_wr->sg_list; 6438c2ecf20Sopenharmony_ci void *kbuf = &sqe->sge[1]; 6448c2ecf20Sopenharmony_ci int num_sge = core_wr->num_sge, bytes = 0; 6458c2ecf20Sopenharmony_ci 6468c2ecf20Sopenharmony_ci sqe->sge[0].laddr = (uintptr_t)kbuf; 6478c2ecf20Sopenharmony_ci sqe->sge[0].lkey = 0; 6488c2ecf20Sopenharmony_ci 6498c2ecf20Sopenharmony_ci while (num_sge--) { 6508c2ecf20Sopenharmony_ci if (!core_sge->length) { 6518c2ecf20Sopenharmony_ci core_sge++; 6528c2ecf20Sopenharmony_ci continue; 6538c2ecf20Sopenharmony_ci } 6548c2ecf20Sopenharmony_ci bytes += core_sge->length; 6558c2ecf20Sopenharmony_ci if (bytes > SIW_MAX_INLINE) { 6568c2ecf20Sopenharmony_ci bytes = -EINVAL; 6578c2ecf20Sopenharmony_ci break; 6588c2ecf20Sopenharmony_ci } 6598c2ecf20Sopenharmony_ci memcpy(kbuf, (void *)(uintptr_t)core_sge->addr, 6608c2ecf20Sopenharmony_ci core_sge->length); 6618c2ecf20Sopenharmony_ci 6628c2ecf20Sopenharmony_ci kbuf += core_sge->length; 6638c2ecf20Sopenharmony_ci core_sge++; 6648c2ecf20Sopenharmony_ci } 6658c2ecf20Sopenharmony_ci sqe->sge[0].length = bytes > 0 ? bytes : 0; 6668c2ecf20Sopenharmony_ci sqe->num_sge = bytes > 0 ? 1 : 0; 6678c2ecf20Sopenharmony_ci 6688c2ecf20Sopenharmony_ci return bytes; 6698c2ecf20Sopenharmony_ci} 6708c2ecf20Sopenharmony_ci 6718c2ecf20Sopenharmony_ci/* Complete SQ WR's without processing */ 6728c2ecf20Sopenharmony_cistatic int siw_sq_flush_wr(struct siw_qp *qp, const struct ib_send_wr *wr, 6738c2ecf20Sopenharmony_ci const struct ib_send_wr **bad_wr) 6748c2ecf20Sopenharmony_ci{ 6758c2ecf20Sopenharmony_ci int rv = 0; 6768c2ecf20Sopenharmony_ci 6778c2ecf20Sopenharmony_ci while (wr) { 6788c2ecf20Sopenharmony_ci struct siw_sqe sqe = {}; 6798c2ecf20Sopenharmony_ci 6808c2ecf20Sopenharmony_ci switch (wr->opcode) { 6818c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 6828c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_WRITE; 6838c2ecf20Sopenharmony_ci break; 6848c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ: 6858c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_READ; 6868c2ecf20Sopenharmony_ci break; 6878c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ_WITH_INV: 6888c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_READ_LOCAL_INV; 6898c2ecf20Sopenharmony_ci break; 6908c2ecf20Sopenharmony_ci case IB_WR_SEND: 6918c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_SEND; 6928c2ecf20Sopenharmony_ci break; 6938c2ecf20Sopenharmony_ci case IB_WR_SEND_WITH_IMM: 6948c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_SEND_WITH_IMM; 6958c2ecf20Sopenharmony_ci break; 6968c2ecf20Sopenharmony_ci case IB_WR_SEND_WITH_INV: 6978c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_SEND_REMOTE_INV; 6988c2ecf20Sopenharmony_ci break; 6998c2ecf20Sopenharmony_ci case IB_WR_LOCAL_INV: 7008c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_INVAL_STAG; 7018c2ecf20Sopenharmony_ci break; 7028c2ecf20Sopenharmony_ci case IB_WR_REG_MR: 7038c2ecf20Sopenharmony_ci sqe.opcode = SIW_OP_REG_MR; 7048c2ecf20Sopenharmony_ci break; 7058c2ecf20Sopenharmony_ci default: 7068c2ecf20Sopenharmony_ci rv = -EINVAL; 7078c2ecf20Sopenharmony_ci break; 7088c2ecf20Sopenharmony_ci } 7098c2ecf20Sopenharmony_ci if (!rv) { 7108c2ecf20Sopenharmony_ci sqe.id = wr->wr_id; 7118c2ecf20Sopenharmony_ci rv = siw_sqe_complete(qp, &sqe, 0, 7128c2ecf20Sopenharmony_ci SIW_WC_WR_FLUSH_ERR); 7138c2ecf20Sopenharmony_ci } 7148c2ecf20Sopenharmony_ci if (rv) { 7158c2ecf20Sopenharmony_ci if (bad_wr) 7168c2ecf20Sopenharmony_ci *bad_wr = wr; 7178c2ecf20Sopenharmony_ci break; 7188c2ecf20Sopenharmony_ci } 7198c2ecf20Sopenharmony_ci wr = wr->next; 7208c2ecf20Sopenharmony_ci } 7218c2ecf20Sopenharmony_ci return rv; 7228c2ecf20Sopenharmony_ci} 7238c2ecf20Sopenharmony_ci 7248c2ecf20Sopenharmony_ci/* Complete RQ WR's without processing */ 7258c2ecf20Sopenharmony_cistatic int siw_rq_flush_wr(struct siw_qp *qp, const struct ib_recv_wr *wr, 7268c2ecf20Sopenharmony_ci const struct ib_recv_wr **bad_wr) 7278c2ecf20Sopenharmony_ci{ 7288c2ecf20Sopenharmony_ci struct siw_rqe rqe = {}; 7298c2ecf20Sopenharmony_ci int rv = 0; 7308c2ecf20Sopenharmony_ci 7318c2ecf20Sopenharmony_ci while (wr) { 7328c2ecf20Sopenharmony_ci rqe.id = wr->wr_id; 7338c2ecf20Sopenharmony_ci rv = siw_rqe_complete(qp, &rqe, 0, 0, SIW_WC_WR_FLUSH_ERR); 7348c2ecf20Sopenharmony_ci if (rv) { 7358c2ecf20Sopenharmony_ci if (bad_wr) 7368c2ecf20Sopenharmony_ci *bad_wr = wr; 7378c2ecf20Sopenharmony_ci break; 7388c2ecf20Sopenharmony_ci } 7398c2ecf20Sopenharmony_ci wr = wr->next; 7408c2ecf20Sopenharmony_ci } 7418c2ecf20Sopenharmony_ci return rv; 7428c2ecf20Sopenharmony_ci} 7438c2ecf20Sopenharmony_ci 7448c2ecf20Sopenharmony_ci/* 7458c2ecf20Sopenharmony_ci * siw_post_send() 7468c2ecf20Sopenharmony_ci * 7478c2ecf20Sopenharmony_ci * Post a list of S-WR's to a SQ. 7488c2ecf20Sopenharmony_ci * 7498c2ecf20Sopenharmony_ci * @base_qp: Base QP contained in siw QP 7508c2ecf20Sopenharmony_ci * @wr: Null terminated list of user WR's 7518c2ecf20Sopenharmony_ci * @bad_wr: Points to failing WR in case of synchronous failure. 7528c2ecf20Sopenharmony_ci */ 7538c2ecf20Sopenharmony_ciint siw_post_send(struct ib_qp *base_qp, const struct ib_send_wr *wr, 7548c2ecf20Sopenharmony_ci const struct ib_send_wr **bad_wr) 7558c2ecf20Sopenharmony_ci{ 7568c2ecf20Sopenharmony_ci struct siw_qp *qp = to_siw_qp(base_qp); 7578c2ecf20Sopenharmony_ci struct siw_wqe *wqe = tx_wqe(qp); 7588c2ecf20Sopenharmony_ci 7598c2ecf20Sopenharmony_ci unsigned long flags; 7608c2ecf20Sopenharmony_ci int rv = 0; 7618c2ecf20Sopenharmony_ci 7628c2ecf20Sopenharmony_ci if (wr && !rdma_is_kernel_res(&qp->base_qp.res)) { 7638c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "wr must be empty for user mapped sq\n"); 7648c2ecf20Sopenharmony_ci *bad_wr = wr; 7658c2ecf20Sopenharmony_ci return -EINVAL; 7668c2ecf20Sopenharmony_ci } 7678c2ecf20Sopenharmony_ci 7688c2ecf20Sopenharmony_ci /* 7698c2ecf20Sopenharmony_ci * Try to acquire QP state lock. Must be non-blocking 7708c2ecf20Sopenharmony_ci * to accommodate kernel clients needs. 7718c2ecf20Sopenharmony_ci */ 7728c2ecf20Sopenharmony_ci if (!down_read_trylock(&qp->state_lock)) { 7738c2ecf20Sopenharmony_ci if (qp->attrs.state == SIW_QP_STATE_ERROR) { 7748c2ecf20Sopenharmony_ci /* 7758c2ecf20Sopenharmony_ci * ERROR state is final, so we can be sure 7768c2ecf20Sopenharmony_ci * this state will not change as long as the QP 7778c2ecf20Sopenharmony_ci * exists. 7788c2ecf20Sopenharmony_ci * 7798c2ecf20Sopenharmony_ci * This handles an ib_drain_sq() call with 7808c2ecf20Sopenharmony_ci * a concurrent request to set the QP state 7818c2ecf20Sopenharmony_ci * to ERROR. 7828c2ecf20Sopenharmony_ci */ 7838c2ecf20Sopenharmony_ci rv = siw_sq_flush_wr(qp, wr, bad_wr); 7848c2ecf20Sopenharmony_ci } else { 7858c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "QP locked, state %d\n", 7868c2ecf20Sopenharmony_ci qp->attrs.state); 7878c2ecf20Sopenharmony_ci *bad_wr = wr; 7888c2ecf20Sopenharmony_ci rv = -ENOTCONN; 7898c2ecf20Sopenharmony_ci } 7908c2ecf20Sopenharmony_ci return rv; 7918c2ecf20Sopenharmony_ci } 7928c2ecf20Sopenharmony_ci if (unlikely(qp->attrs.state != SIW_QP_STATE_RTS)) { 7938c2ecf20Sopenharmony_ci if (qp->attrs.state == SIW_QP_STATE_ERROR) { 7948c2ecf20Sopenharmony_ci /* 7958c2ecf20Sopenharmony_ci * Immediately flush this WR to CQ, if QP 7968c2ecf20Sopenharmony_ci * is in ERROR state. SQ is guaranteed to 7978c2ecf20Sopenharmony_ci * be empty, so WR complets in-order. 7988c2ecf20Sopenharmony_ci * 7998c2ecf20Sopenharmony_ci * Typically triggered by ib_drain_sq(). 8008c2ecf20Sopenharmony_ci */ 8018c2ecf20Sopenharmony_ci rv = siw_sq_flush_wr(qp, wr, bad_wr); 8028c2ecf20Sopenharmony_ci } else { 8038c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "QP out of state %d\n", 8048c2ecf20Sopenharmony_ci qp->attrs.state); 8058c2ecf20Sopenharmony_ci *bad_wr = wr; 8068c2ecf20Sopenharmony_ci rv = -ENOTCONN; 8078c2ecf20Sopenharmony_ci } 8088c2ecf20Sopenharmony_ci up_read(&qp->state_lock); 8098c2ecf20Sopenharmony_ci return rv; 8108c2ecf20Sopenharmony_ci } 8118c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->sq_lock, flags); 8128c2ecf20Sopenharmony_ci 8138c2ecf20Sopenharmony_ci while (wr) { 8148c2ecf20Sopenharmony_ci u32 idx = qp->sq_put % qp->attrs.sq_size; 8158c2ecf20Sopenharmony_ci struct siw_sqe *sqe = &qp->sendq[idx]; 8168c2ecf20Sopenharmony_ci 8178c2ecf20Sopenharmony_ci if (sqe->flags) { 8188c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "sq full\n"); 8198c2ecf20Sopenharmony_ci rv = -ENOMEM; 8208c2ecf20Sopenharmony_ci break; 8218c2ecf20Sopenharmony_ci } 8228c2ecf20Sopenharmony_ci if (wr->num_sge > qp->attrs.sq_max_sges) { 8238c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "too many sge's: %d\n", wr->num_sge); 8248c2ecf20Sopenharmony_ci rv = -EINVAL; 8258c2ecf20Sopenharmony_ci break; 8268c2ecf20Sopenharmony_ci } 8278c2ecf20Sopenharmony_ci sqe->id = wr->wr_id; 8288c2ecf20Sopenharmony_ci 8298c2ecf20Sopenharmony_ci if ((wr->send_flags & IB_SEND_SIGNALED) || 8308c2ecf20Sopenharmony_ci (qp->attrs.flags & SIW_SIGNAL_ALL_WR)) 8318c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_SIGNALLED; 8328c2ecf20Sopenharmony_ci 8338c2ecf20Sopenharmony_ci if (wr->send_flags & IB_SEND_FENCE) 8348c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_READ_FENCE; 8358c2ecf20Sopenharmony_ci 8368c2ecf20Sopenharmony_ci switch (wr->opcode) { 8378c2ecf20Sopenharmony_ci case IB_WR_SEND: 8388c2ecf20Sopenharmony_ci case IB_WR_SEND_WITH_INV: 8398c2ecf20Sopenharmony_ci if (wr->send_flags & IB_SEND_SOLICITED) 8408c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_SOLICITED; 8418c2ecf20Sopenharmony_ci 8428c2ecf20Sopenharmony_ci if (!(wr->send_flags & IB_SEND_INLINE)) { 8438c2ecf20Sopenharmony_ci siw_copy_sgl(wr->sg_list, sqe->sge, 8448c2ecf20Sopenharmony_ci wr->num_sge); 8458c2ecf20Sopenharmony_ci sqe->num_sge = wr->num_sge; 8468c2ecf20Sopenharmony_ci } else { 8478c2ecf20Sopenharmony_ci rv = siw_copy_inline_sgl(wr, sqe); 8488c2ecf20Sopenharmony_ci if (rv <= 0) { 8498c2ecf20Sopenharmony_ci rv = -EINVAL; 8508c2ecf20Sopenharmony_ci break; 8518c2ecf20Sopenharmony_ci } 8528c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_INLINE; 8538c2ecf20Sopenharmony_ci sqe->num_sge = 1; 8548c2ecf20Sopenharmony_ci } 8558c2ecf20Sopenharmony_ci if (wr->opcode == IB_WR_SEND) 8568c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_SEND; 8578c2ecf20Sopenharmony_ci else { 8588c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_SEND_REMOTE_INV; 8598c2ecf20Sopenharmony_ci sqe->rkey = wr->ex.invalidate_rkey; 8608c2ecf20Sopenharmony_ci } 8618c2ecf20Sopenharmony_ci break; 8628c2ecf20Sopenharmony_ci 8638c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ_WITH_INV: 8648c2ecf20Sopenharmony_ci case IB_WR_RDMA_READ: 8658c2ecf20Sopenharmony_ci /* 8668c2ecf20Sopenharmony_ci * iWarp restricts RREAD sink to SGL containing 8678c2ecf20Sopenharmony_ci * 1 SGE only. we could relax to SGL with multiple 8688c2ecf20Sopenharmony_ci * elements referring the SAME ltag or even sending 8698c2ecf20Sopenharmony_ci * a private per-rreq tag referring to a checked 8708c2ecf20Sopenharmony_ci * local sgl with MULTIPLE ltag's. 8718c2ecf20Sopenharmony_ci */ 8728c2ecf20Sopenharmony_ci if (unlikely(wr->num_sge != 1)) { 8738c2ecf20Sopenharmony_ci rv = -EINVAL; 8748c2ecf20Sopenharmony_ci break; 8758c2ecf20Sopenharmony_ci } 8768c2ecf20Sopenharmony_ci siw_copy_sgl(wr->sg_list, &sqe->sge[0], 1); 8778c2ecf20Sopenharmony_ci /* 8788c2ecf20Sopenharmony_ci * NOTE: zero length RREAD is allowed! 8798c2ecf20Sopenharmony_ci */ 8808c2ecf20Sopenharmony_ci sqe->raddr = rdma_wr(wr)->remote_addr; 8818c2ecf20Sopenharmony_ci sqe->rkey = rdma_wr(wr)->rkey; 8828c2ecf20Sopenharmony_ci sqe->num_sge = 1; 8838c2ecf20Sopenharmony_ci 8848c2ecf20Sopenharmony_ci if (wr->opcode == IB_WR_RDMA_READ) 8858c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_READ; 8868c2ecf20Sopenharmony_ci else 8878c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_READ_LOCAL_INV; 8888c2ecf20Sopenharmony_ci break; 8898c2ecf20Sopenharmony_ci 8908c2ecf20Sopenharmony_ci case IB_WR_RDMA_WRITE: 8918c2ecf20Sopenharmony_ci if (!(wr->send_flags & IB_SEND_INLINE)) { 8928c2ecf20Sopenharmony_ci siw_copy_sgl(wr->sg_list, &sqe->sge[0], 8938c2ecf20Sopenharmony_ci wr->num_sge); 8948c2ecf20Sopenharmony_ci sqe->num_sge = wr->num_sge; 8958c2ecf20Sopenharmony_ci } else { 8968c2ecf20Sopenharmony_ci rv = siw_copy_inline_sgl(wr, sqe); 8978c2ecf20Sopenharmony_ci if (unlikely(rv < 0)) { 8988c2ecf20Sopenharmony_ci rv = -EINVAL; 8998c2ecf20Sopenharmony_ci break; 9008c2ecf20Sopenharmony_ci } 9018c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_INLINE; 9028c2ecf20Sopenharmony_ci sqe->num_sge = 1; 9038c2ecf20Sopenharmony_ci } 9048c2ecf20Sopenharmony_ci sqe->raddr = rdma_wr(wr)->remote_addr; 9058c2ecf20Sopenharmony_ci sqe->rkey = rdma_wr(wr)->rkey; 9068c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_WRITE; 9078c2ecf20Sopenharmony_ci break; 9088c2ecf20Sopenharmony_ci 9098c2ecf20Sopenharmony_ci case IB_WR_REG_MR: 9108c2ecf20Sopenharmony_ci sqe->base_mr = (uintptr_t)reg_wr(wr)->mr; 9118c2ecf20Sopenharmony_ci sqe->rkey = reg_wr(wr)->key; 9128c2ecf20Sopenharmony_ci sqe->access = reg_wr(wr)->access & IWARP_ACCESS_MASK; 9138c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_REG_MR; 9148c2ecf20Sopenharmony_ci break; 9158c2ecf20Sopenharmony_ci 9168c2ecf20Sopenharmony_ci case IB_WR_LOCAL_INV: 9178c2ecf20Sopenharmony_ci sqe->rkey = wr->ex.invalidate_rkey; 9188c2ecf20Sopenharmony_ci sqe->opcode = SIW_OP_INVAL_STAG; 9198c2ecf20Sopenharmony_ci break; 9208c2ecf20Sopenharmony_ci 9218c2ecf20Sopenharmony_ci default: 9228c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "ib wr type %d unsupported\n", 9238c2ecf20Sopenharmony_ci wr->opcode); 9248c2ecf20Sopenharmony_ci rv = -EINVAL; 9258c2ecf20Sopenharmony_ci break; 9268c2ecf20Sopenharmony_ci } 9278c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "opcode %d, flags 0x%x, wr_id 0x%pK\n", 9288c2ecf20Sopenharmony_ci sqe->opcode, sqe->flags, 9298c2ecf20Sopenharmony_ci (void *)(uintptr_t)sqe->id); 9308c2ecf20Sopenharmony_ci 9318c2ecf20Sopenharmony_ci if (unlikely(rv < 0)) 9328c2ecf20Sopenharmony_ci break; 9338c2ecf20Sopenharmony_ci 9348c2ecf20Sopenharmony_ci /* make SQE only valid after completely written */ 9358c2ecf20Sopenharmony_ci smp_wmb(); 9368c2ecf20Sopenharmony_ci sqe->flags |= SIW_WQE_VALID; 9378c2ecf20Sopenharmony_ci 9388c2ecf20Sopenharmony_ci qp->sq_put++; 9398c2ecf20Sopenharmony_ci wr = wr->next; 9408c2ecf20Sopenharmony_ci } 9418c2ecf20Sopenharmony_ci 9428c2ecf20Sopenharmony_ci /* 9438c2ecf20Sopenharmony_ci * Send directly if SQ processing is not in progress. 9448c2ecf20Sopenharmony_ci * Eventual immediate errors (rv < 0) do not affect the involved 9458c2ecf20Sopenharmony_ci * RI resources (Verbs, 8.3.1) and thus do not prevent from SQ 9468c2ecf20Sopenharmony_ci * processing, if new work is already pending. But rv must be passed 9478c2ecf20Sopenharmony_ci * to caller. 9488c2ecf20Sopenharmony_ci */ 9498c2ecf20Sopenharmony_ci if (wqe->wr_status != SIW_WR_IDLE) { 9508c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->sq_lock, flags); 9518c2ecf20Sopenharmony_ci goto skip_direct_sending; 9528c2ecf20Sopenharmony_ci } 9538c2ecf20Sopenharmony_ci rv = siw_activate_tx(qp); 9548c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->sq_lock, flags); 9558c2ecf20Sopenharmony_ci 9568c2ecf20Sopenharmony_ci if (rv <= 0) 9578c2ecf20Sopenharmony_ci goto skip_direct_sending; 9588c2ecf20Sopenharmony_ci 9598c2ecf20Sopenharmony_ci if (rdma_is_kernel_res(&qp->base_qp.res)) { 9608c2ecf20Sopenharmony_ci rv = siw_sq_start(qp); 9618c2ecf20Sopenharmony_ci } else { 9628c2ecf20Sopenharmony_ci qp->tx_ctx.in_syscall = 1; 9638c2ecf20Sopenharmony_ci 9648c2ecf20Sopenharmony_ci if (siw_qp_sq_process(qp) != 0 && !(qp->tx_ctx.tx_suspend)) 9658c2ecf20Sopenharmony_ci siw_qp_cm_drop(qp, 0); 9668c2ecf20Sopenharmony_ci 9678c2ecf20Sopenharmony_ci qp->tx_ctx.in_syscall = 0; 9688c2ecf20Sopenharmony_ci } 9698c2ecf20Sopenharmony_ciskip_direct_sending: 9708c2ecf20Sopenharmony_ci 9718c2ecf20Sopenharmony_ci up_read(&qp->state_lock); 9728c2ecf20Sopenharmony_ci 9738c2ecf20Sopenharmony_ci if (rv >= 0) 9748c2ecf20Sopenharmony_ci return 0; 9758c2ecf20Sopenharmony_ci /* 9768c2ecf20Sopenharmony_ci * Immediate error 9778c2ecf20Sopenharmony_ci */ 9788c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "error %d\n", rv); 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_ci *bad_wr = wr; 9818c2ecf20Sopenharmony_ci return rv; 9828c2ecf20Sopenharmony_ci} 9838c2ecf20Sopenharmony_ci 9848c2ecf20Sopenharmony_ci/* 9858c2ecf20Sopenharmony_ci * siw_post_receive() 9868c2ecf20Sopenharmony_ci * 9878c2ecf20Sopenharmony_ci * Post a list of R-WR's to a RQ. 9888c2ecf20Sopenharmony_ci * 9898c2ecf20Sopenharmony_ci * @base_qp: Base QP contained in siw QP 9908c2ecf20Sopenharmony_ci * @wr: Null terminated list of user WR's 9918c2ecf20Sopenharmony_ci * @bad_wr: Points to failing WR in case of synchronous failure. 9928c2ecf20Sopenharmony_ci */ 9938c2ecf20Sopenharmony_ciint siw_post_receive(struct ib_qp *base_qp, const struct ib_recv_wr *wr, 9948c2ecf20Sopenharmony_ci const struct ib_recv_wr **bad_wr) 9958c2ecf20Sopenharmony_ci{ 9968c2ecf20Sopenharmony_ci struct siw_qp *qp = to_siw_qp(base_qp); 9978c2ecf20Sopenharmony_ci unsigned long flags; 9988c2ecf20Sopenharmony_ci int rv = 0; 9998c2ecf20Sopenharmony_ci 10008c2ecf20Sopenharmony_ci if (qp->srq || qp->attrs.rq_size == 0) { 10018c2ecf20Sopenharmony_ci *bad_wr = wr; 10028c2ecf20Sopenharmony_ci return -EINVAL; 10038c2ecf20Sopenharmony_ci } 10048c2ecf20Sopenharmony_ci if (!rdma_is_kernel_res(&qp->base_qp.res)) { 10058c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "no kernel post_recv for user mapped rq\n"); 10068c2ecf20Sopenharmony_ci *bad_wr = wr; 10078c2ecf20Sopenharmony_ci return -EINVAL; 10088c2ecf20Sopenharmony_ci } 10098c2ecf20Sopenharmony_ci 10108c2ecf20Sopenharmony_ci /* 10118c2ecf20Sopenharmony_ci * Try to acquire QP state lock. Must be non-blocking 10128c2ecf20Sopenharmony_ci * to accommodate kernel clients needs. 10138c2ecf20Sopenharmony_ci */ 10148c2ecf20Sopenharmony_ci if (!down_read_trylock(&qp->state_lock)) { 10158c2ecf20Sopenharmony_ci if (qp->attrs.state == SIW_QP_STATE_ERROR) { 10168c2ecf20Sopenharmony_ci /* 10178c2ecf20Sopenharmony_ci * ERROR state is final, so we can be sure 10188c2ecf20Sopenharmony_ci * this state will not change as long as the QP 10198c2ecf20Sopenharmony_ci * exists. 10208c2ecf20Sopenharmony_ci * 10218c2ecf20Sopenharmony_ci * This handles an ib_drain_rq() call with 10228c2ecf20Sopenharmony_ci * a concurrent request to set the QP state 10238c2ecf20Sopenharmony_ci * to ERROR. 10248c2ecf20Sopenharmony_ci */ 10258c2ecf20Sopenharmony_ci rv = siw_rq_flush_wr(qp, wr, bad_wr); 10268c2ecf20Sopenharmony_ci } else { 10278c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "QP locked, state %d\n", 10288c2ecf20Sopenharmony_ci qp->attrs.state); 10298c2ecf20Sopenharmony_ci *bad_wr = wr; 10308c2ecf20Sopenharmony_ci rv = -ENOTCONN; 10318c2ecf20Sopenharmony_ci } 10328c2ecf20Sopenharmony_ci return rv; 10338c2ecf20Sopenharmony_ci } 10348c2ecf20Sopenharmony_ci if (qp->attrs.state > SIW_QP_STATE_RTS) { 10358c2ecf20Sopenharmony_ci if (qp->attrs.state == SIW_QP_STATE_ERROR) { 10368c2ecf20Sopenharmony_ci /* 10378c2ecf20Sopenharmony_ci * Immediately flush this WR to CQ, if QP 10388c2ecf20Sopenharmony_ci * is in ERROR state. RQ is guaranteed to 10398c2ecf20Sopenharmony_ci * be empty, so WR complets in-order. 10408c2ecf20Sopenharmony_ci * 10418c2ecf20Sopenharmony_ci * Typically triggered by ib_drain_rq(). 10428c2ecf20Sopenharmony_ci */ 10438c2ecf20Sopenharmony_ci rv = siw_rq_flush_wr(qp, wr, bad_wr); 10448c2ecf20Sopenharmony_ci } else { 10458c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "QP out of state %d\n", 10468c2ecf20Sopenharmony_ci qp->attrs.state); 10478c2ecf20Sopenharmony_ci *bad_wr = wr; 10488c2ecf20Sopenharmony_ci rv = -ENOTCONN; 10498c2ecf20Sopenharmony_ci } 10508c2ecf20Sopenharmony_ci up_read(&qp->state_lock); 10518c2ecf20Sopenharmony_ci return rv; 10528c2ecf20Sopenharmony_ci } 10538c2ecf20Sopenharmony_ci /* 10548c2ecf20Sopenharmony_ci * Serialize potentially multiple producers. 10558c2ecf20Sopenharmony_ci * Not needed for single threaded consumer side. 10568c2ecf20Sopenharmony_ci */ 10578c2ecf20Sopenharmony_ci spin_lock_irqsave(&qp->rq_lock, flags); 10588c2ecf20Sopenharmony_ci 10598c2ecf20Sopenharmony_ci while (wr) { 10608c2ecf20Sopenharmony_ci u32 idx = qp->rq_put % qp->attrs.rq_size; 10618c2ecf20Sopenharmony_ci struct siw_rqe *rqe = &qp->recvq[idx]; 10628c2ecf20Sopenharmony_ci 10638c2ecf20Sopenharmony_ci if (rqe->flags) { 10648c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "RQ full\n"); 10658c2ecf20Sopenharmony_ci rv = -ENOMEM; 10668c2ecf20Sopenharmony_ci break; 10678c2ecf20Sopenharmony_ci } 10688c2ecf20Sopenharmony_ci if (wr->num_sge > qp->attrs.rq_max_sges) { 10698c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "too many sge's: %d\n", wr->num_sge); 10708c2ecf20Sopenharmony_ci rv = -EINVAL; 10718c2ecf20Sopenharmony_ci break; 10728c2ecf20Sopenharmony_ci } 10738c2ecf20Sopenharmony_ci rqe->id = wr->wr_id; 10748c2ecf20Sopenharmony_ci rqe->num_sge = wr->num_sge; 10758c2ecf20Sopenharmony_ci siw_copy_sgl(wr->sg_list, rqe->sge, wr->num_sge); 10768c2ecf20Sopenharmony_ci 10778c2ecf20Sopenharmony_ci /* make sure RQE is completely written before valid */ 10788c2ecf20Sopenharmony_ci smp_wmb(); 10798c2ecf20Sopenharmony_ci 10808c2ecf20Sopenharmony_ci rqe->flags = SIW_WQE_VALID; 10818c2ecf20Sopenharmony_ci 10828c2ecf20Sopenharmony_ci qp->rq_put++; 10838c2ecf20Sopenharmony_ci wr = wr->next; 10848c2ecf20Sopenharmony_ci } 10858c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&qp->rq_lock, flags); 10868c2ecf20Sopenharmony_ci 10878c2ecf20Sopenharmony_ci up_read(&qp->state_lock); 10888c2ecf20Sopenharmony_ci 10898c2ecf20Sopenharmony_ci if (rv < 0) { 10908c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "error %d\n", rv); 10918c2ecf20Sopenharmony_ci *bad_wr = wr; 10928c2ecf20Sopenharmony_ci } 10938c2ecf20Sopenharmony_ci return rv > 0 ? 0 : rv; 10948c2ecf20Sopenharmony_ci} 10958c2ecf20Sopenharmony_ci 10968c2ecf20Sopenharmony_ciint siw_destroy_cq(struct ib_cq *base_cq, struct ib_udata *udata) 10978c2ecf20Sopenharmony_ci{ 10988c2ecf20Sopenharmony_ci struct siw_cq *cq = to_siw_cq(base_cq); 10998c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_cq->device); 11008c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = 11018c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 11028c2ecf20Sopenharmony_ci base_ucontext); 11038c2ecf20Sopenharmony_ci 11048c2ecf20Sopenharmony_ci siw_dbg_cq(cq, "free CQ resources\n"); 11058c2ecf20Sopenharmony_ci 11068c2ecf20Sopenharmony_ci siw_cq_flush(cq); 11078c2ecf20Sopenharmony_ci 11088c2ecf20Sopenharmony_ci if (ctx) 11098c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(cq->cq_entry); 11108c2ecf20Sopenharmony_ci 11118c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_cq); 11128c2ecf20Sopenharmony_ci 11138c2ecf20Sopenharmony_ci vfree(cq->queue); 11148c2ecf20Sopenharmony_ci return 0; 11158c2ecf20Sopenharmony_ci} 11168c2ecf20Sopenharmony_ci 11178c2ecf20Sopenharmony_ci/* 11188c2ecf20Sopenharmony_ci * siw_create_cq() 11198c2ecf20Sopenharmony_ci * 11208c2ecf20Sopenharmony_ci * Populate CQ of requested size 11218c2ecf20Sopenharmony_ci * 11228c2ecf20Sopenharmony_ci * @base_cq: CQ as allocated by RDMA midlayer 11238c2ecf20Sopenharmony_ci * @attr: Initial CQ attributes 11248c2ecf20Sopenharmony_ci * @udata: relates to user context 11258c2ecf20Sopenharmony_ci */ 11268c2ecf20Sopenharmony_ci 11278c2ecf20Sopenharmony_ciint siw_create_cq(struct ib_cq *base_cq, const struct ib_cq_init_attr *attr, 11288c2ecf20Sopenharmony_ci struct ib_udata *udata) 11298c2ecf20Sopenharmony_ci{ 11308c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_cq->device); 11318c2ecf20Sopenharmony_ci struct siw_cq *cq = to_siw_cq(base_cq); 11328c2ecf20Sopenharmony_ci int rv, size = attr->cqe; 11338c2ecf20Sopenharmony_ci 11348c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_cq) > SIW_MAX_CQ) { 11358c2ecf20Sopenharmony_ci siw_dbg(base_cq->device, "too many CQ's\n"); 11368c2ecf20Sopenharmony_ci rv = -ENOMEM; 11378c2ecf20Sopenharmony_ci goto err_out; 11388c2ecf20Sopenharmony_ci } 11398c2ecf20Sopenharmony_ci if (size < 1 || size > sdev->attrs.max_cqe) { 11408c2ecf20Sopenharmony_ci siw_dbg(base_cq->device, "CQ size error: %d\n", size); 11418c2ecf20Sopenharmony_ci rv = -EINVAL; 11428c2ecf20Sopenharmony_ci goto err_out; 11438c2ecf20Sopenharmony_ci } 11448c2ecf20Sopenharmony_ci size = roundup_pow_of_two(size); 11458c2ecf20Sopenharmony_ci cq->base_cq.cqe = size; 11468c2ecf20Sopenharmony_ci cq->num_cqe = size; 11478c2ecf20Sopenharmony_ci 11488c2ecf20Sopenharmony_ci if (udata) 11498c2ecf20Sopenharmony_ci cq->queue = vmalloc_user(size * sizeof(struct siw_cqe) + 11508c2ecf20Sopenharmony_ci sizeof(struct siw_cq_ctrl)); 11518c2ecf20Sopenharmony_ci else 11528c2ecf20Sopenharmony_ci cq->queue = vzalloc(size * sizeof(struct siw_cqe) + 11538c2ecf20Sopenharmony_ci sizeof(struct siw_cq_ctrl)); 11548c2ecf20Sopenharmony_ci 11558c2ecf20Sopenharmony_ci if (cq->queue == NULL) { 11568c2ecf20Sopenharmony_ci rv = -ENOMEM; 11578c2ecf20Sopenharmony_ci goto err_out; 11588c2ecf20Sopenharmony_ci } 11598c2ecf20Sopenharmony_ci get_random_bytes(&cq->id, 4); 11608c2ecf20Sopenharmony_ci siw_dbg(base_cq->device, "new CQ [%u]\n", cq->id); 11618c2ecf20Sopenharmony_ci 11628c2ecf20Sopenharmony_ci spin_lock_init(&cq->lock); 11638c2ecf20Sopenharmony_ci 11648c2ecf20Sopenharmony_ci cq->notify = (struct siw_cq_ctrl *)&cq->queue[size]; 11658c2ecf20Sopenharmony_ci 11668c2ecf20Sopenharmony_ci if (udata) { 11678c2ecf20Sopenharmony_ci struct siw_uresp_create_cq uresp = {}; 11688c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = 11698c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 11708c2ecf20Sopenharmony_ci base_ucontext); 11718c2ecf20Sopenharmony_ci size_t length = size * sizeof(struct siw_cqe) + 11728c2ecf20Sopenharmony_ci sizeof(struct siw_cq_ctrl); 11738c2ecf20Sopenharmony_ci 11748c2ecf20Sopenharmony_ci cq->cq_entry = 11758c2ecf20Sopenharmony_ci siw_mmap_entry_insert(ctx, cq->queue, 11768c2ecf20Sopenharmony_ci length, &uresp.cq_key); 11778c2ecf20Sopenharmony_ci if (!cq->cq_entry) { 11788c2ecf20Sopenharmony_ci rv = -ENOMEM; 11798c2ecf20Sopenharmony_ci goto err_out; 11808c2ecf20Sopenharmony_ci } 11818c2ecf20Sopenharmony_ci 11828c2ecf20Sopenharmony_ci uresp.cq_id = cq->id; 11838c2ecf20Sopenharmony_ci uresp.num_cqe = size; 11848c2ecf20Sopenharmony_ci 11858c2ecf20Sopenharmony_ci if (udata->outlen < sizeof(uresp)) { 11868c2ecf20Sopenharmony_ci rv = -EINVAL; 11878c2ecf20Sopenharmony_ci goto err_out; 11888c2ecf20Sopenharmony_ci } 11898c2ecf20Sopenharmony_ci rv = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 11908c2ecf20Sopenharmony_ci if (rv) 11918c2ecf20Sopenharmony_ci goto err_out; 11928c2ecf20Sopenharmony_ci } 11938c2ecf20Sopenharmony_ci return 0; 11948c2ecf20Sopenharmony_ci 11958c2ecf20Sopenharmony_cierr_out: 11968c2ecf20Sopenharmony_ci siw_dbg(base_cq->device, "CQ creation failed: %d", rv); 11978c2ecf20Sopenharmony_ci 11988c2ecf20Sopenharmony_ci if (cq && cq->queue) { 11998c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = 12008c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 12018c2ecf20Sopenharmony_ci base_ucontext); 12028c2ecf20Sopenharmony_ci if (ctx) 12038c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(cq->cq_entry); 12048c2ecf20Sopenharmony_ci vfree(cq->queue); 12058c2ecf20Sopenharmony_ci } 12068c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_cq); 12078c2ecf20Sopenharmony_ci 12088c2ecf20Sopenharmony_ci return rv; 12098c2ecf20Sopenharmony_ci} 12108c2ecf20Sopenharmony_ci 12118c2ecf20Sopenharmony_ci/* 12128c2ecf20Sopenharmony_ci * siw_poll_cq() 12138c2ecf20Sopenharmony_ci * 12148c2ecf20Sopenharmony_ci * Reap CQ entries if available and copy work completion status into 12158c2ecf20Sopenharmony_ci * array of WC's provided by caller. Returns number of reaped CQE's. 12168c2ecf20Sopenharmony_ci * 12178c2ecf20Sopenharmony_ci * @base_cq: Base CQ contained in siw CQ. 12188c2ecf20Sopenharmony_ci * @num_cqe: Maximum number of CQE's to reap. 12198c2ecf20Sopenharmony_ci * @wc: Array of work completions to be filled by siw. 12208c2ecf20Sopenharmony_ci */ 12218c2ecf20Sopenharmony_ciint siw_poll_cq(struct ib_cq *base_cq, int num_cqe, struct ib_wc *wc) 12228c2ecf20Sopenharmony_ci{ 12238c2ecf20Sopenharmony_ci struct siw_cq *cq = to_siw_cq(base_cq); 12248c2ecf20Sopenharmony_ci int i; 12258c2ecf20Sopenharmony_ci 12268c2ecf20Sopenharmony_ci for (i = 0; i < num_cqe; i++) { 12278c2ecf20Sopenharmony_ci if (!siw_reap_cqe(cq, wc)) 12288c2ecf20Sopenharmony_ci break; 12298c2ecf20Sopenharmony_ci wc++; 12308c2ecf20Sopenharmony_ci } 12318c2ecf20Sopenharmony_ci return i; 12328c2ecf20Sopenharmony_ci} 12338c2ecf20Sopenharmony_ci 12348c2ecf20Sopenharmony_ci/* 12358c2ecf20Sopenharmony_ci * siw_req_notify_cq() 12368c2ecf20Sopenharmony_ci * 12378c2ecf20Sopenharmony_ci * Request notification for new CQE's added to that CQ. 12388c2ecf20Sopenharmony_ci * Defined flags: 12398c2ecf20Sopenharmony_ci * o SIW_CQ_NOTIFY_SOLICITED lets siw trigger a notification 12408c2ecf20Sopenharmony_ci * event if a WQE with notification flag set enters the CQ 12418c2ecf20Sopenharmony_ci * o SIW_CQ_NOTIFY_NEXT_COMP lets siw trigger a notification 12428c2ecf20Sopenharmony_ci * event if a WQE enters the CQ. 12438c2ecf20Sopenharmony_ci * o IB_CQ_REPORT_MISSED_EVENTS: return value will provide the 12448c2ecf20Sopenharmony_ci * number of not reaped CQE's regardless of its notification 12458c2ecf20Sopenharmony_ci * type and current or new CQ notification settings. 12468c2ecf20Sopenharmony_ci * 12478c2ecf20Sopenharmony_ci * @base_cq: Base CQ contained in siw CQ. 12488c2ecf20Sopenharmony_ci * @flags: Requested notification flags. 12498c2ecf20Sopenharmony_ci */ 12508c2ecf20Sopenharmony_ciint siw_req_notify_cq(struct ib_cq *base_cq, enum ib_cq_notify_flags flags) 12518c2ecf20Sopenharmony_ci{ 12528c2ecf20Sopenharmony_ci struct siw_cq *cq = to_siw_cq(base_cq); 12538c2ecf20Sopenharmony_ci 12548c2ecf20Sopenharmony_ci siw_dbg_cq(cq, "flags: 0x%02x\n", flags); 12558c2ecf20Sopenharmony_ci 12568c2ecf20Sopenharmony_ci if ((flags & IB_CQ_SOLICITED_MASK) == IB_CQ_SOLICITED) 12578c2ecf20Sopenharmony_ci /* 12588c2ecf20Sopenharmony_ci * Enable CQ event for next solicited completion. 12598c2ecf20Sopenharmony_ci * and make it visible to all associated producers. 12608c2ecf20Sopenharmony_ci */ 12618c2ecf20Sopenharmony_ci smp_store_mb(cq->notify->flags, SIW_NOTIFY_SOLICITED); 12628c2ecf20Sopenharmony_ci else 12638c2ecf20Sopenharmony_ci /* 12648c2ecf20Sopenharmony_ci * Enable CQ event for any signalled completion. 12658c2ecf20Sopenharmony_ci * and make it visible to all associated producers. 12668c2ecf20Sopenharmony_ci */ 12678c2ecf20Sopenharmony_ci smp_store_mb(cq->notify->flags, SIW_NOTIFY_ALL); 12688c2ecf20Sopenharmony_ci 12698c2ecf20Sopenharmony_ci if (flags & IB_CQ_REPORT_MISSED_EVENTS) 12708c2ecf20Sopenharmony_ci return cq->cq_put - cq->cq_get; 12718c2ecf20Sopenharmony_ci 12728c2ecf20Sopenharmony_ci return 0; 12738c2ecf20Sopenharmony_ci} 12748c2ecf20Sopenharmony_ci 12758c2ecf20Sopenharmony_ci/* 12768c2ecf20Sopenharmony_ci * siw_dereg_mr() 12778c2ecf20Sopenharmony_ci * 12788c2ecf20Sopenharmony_ci * Release Memory Region. 12798c2ecf20Sopenharmony_ci * 12808c2ecf20Sopenharmony_ci * @base_mr: Base MR contained in siw MR. 12818c2ecf20Sopenharmony_ci * @udata: points to user context, unused. 12828c2ecf20Sopenharmony_ci */ 12838c2ecf20Sopenharmony_ciint siw_dereg_mr(struct ib_mr *base_mr, struct ib_udata *udata) 12848c2ecf20Sopenharmony_ci{ 12858c2ecf20Sopenharmony_ci struct siw_mr *mr = to_siw_mr(base_mr); 12868c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_mr->device); 12878c2ecf20Sopenharmony_ci 12888c2ecf20Sopenharmony_ci siw_dbg_mem(mr->mem, "deregister MR\n"); 12898c2ecf20Sopenharmony_ci 12908c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_mr); 12918c2ecf20Sopenharmony_ci 12928c2ecf20Sopenharmony_ci siw_mr_drop_mem(mr); 12938c2ecf20Sopenharmony_ci kfree_rcu(mr, rcu); 12948c2ecf20Sopenharmony_ci 12958c2ecf20Sopenharmony_ci return 0; 12968c2ecf20Sopenharmony_ci} 12978c2ecf20Sopenharmony_ci 12988c2ecf20Sopenharmony_ci/* 12998c2ecf20Sopenharmony_ci * siw_reg_user_mr() 13008c2ecf20Sopenharmony_ci * 13018c2ecf20Sopenharmony_ci * Register Memory Region. 13028c2ecf20Sopenharmony_ci * 13038c2ecf20Sopenharmony_ci * @pd: Protection Domain 13048c2ecf20Sopenharmony_ci * @start: starting address of MR (virtual address) 13058c2ecf20Sopenharmony_ci * @len: len of MR 13068c2ecf20Sopenharmony_ci * @rnic_va: not used by siw 13078c2ecf20Sopenharmony_ci * @rights: MR access rights 13088c2ecf20Sopenharmony_ci * @udata: user buffer to communicate STag and Key. 13098c2ecf20Sopenharmony_ci */ 13108c2ecf20Sopenharmony_cistruct ib_mr *siw_reg_user_mr(struct ib_pd *pd, u64 start, u64 len, 13118c2ecf20Sopenharmony_ci u64 rnic_va, int rights, struct ib_udata *udata) 13128c2ecf20Sopenharmony_ci{ 13138c2ecf20Sopenharmony_ci struct siw_mr *mr = NULL; 13148c2ecf20Sopenharmony_ci struct siw_umem *umem = NULL; 13158c2ecf20Sopenharmony_ci struct siw_ureq_reg_mr ureq; 13168c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(pd->device); 13178c2ecf20Sopenharmony_ci 13188c2ecf20Sopenharmony_ci unsigned long mem_limit = rlimit(RLIMIT_MEMLOCK); 13198c2ecf20Sopenharmony_ci int rv; 13208c2ecf20Sopenharmony_ci 13218c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "start: 0x%pK, va: 0x%pK, len: %llu\n", 13228c2ecf20Sopenharmony_ci (void *)(uintptr_t)start, (void *)(uintptr_t)rnic_va, 13238c2ecf20Sopenharmony_ci (unsigned long long)len); 13248c2ecf20Sopenharmony_ci 13258c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_mr) > SIW_MAX_MR) { 13268c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "too many mr's\n"); 13278c2ecf20Sopenharmony_ci rv = -ENOMEM; 13288c2ecf20Sopenharmony_ci goto err_out; 13298c2ecf20Sopenharmony_ci } 13308c2ecf20Sopenharmony_ci if (!len) { 13318c2ecf20Sopenharmony_ci rv = -EINVAL; 13328c2ecf20Sopenharmony_ci goto err_out; 13338c2ecf20Sopenharmony_ci } 13348c2ecf20Sopenharmony_ci if (mem_limit != RLIM_INFINITY) { 13358c2ecf20Sopenharmony_ci unsigned long num_pages = 13368c2ecf20Sopenharmony_ci (PAGE_ALIGN(len + (start & ~PAGE_MASK))) >> PAGE_SHIFT; 13378c2ecf20Sopenharmony_ci mem_limit >>= PAGE_SHIFT; 13388c2ecf20Sopenharmony_ci 13398c2ecf20Sopenharmony_ci if (num_pages > mem_limit - current->mm->locked_vm) { 13408c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "pages req %lu, max %lu, lock %lu\n", 13418c2ecf20Sopenharmony_ci num_pages, mem_limit, 13428c2ecf20Sopenharmony_ci current->mm->locked_vm); 13438c2ecf20Sopenharmony_ci rv = -ENOMEM; 13448c2ecf20Sopenharmony_ci goto err_out; 13458c2ecf20Sopenharmony_ci } 13468c2ecf20Sopenharmony_ci } 13478c2ecf20Sopenharmony_ci umem = siw_umem_get(start, len, ib_access_writable(rights)); 13488c2ecf20Sopenharmony_ci if (IS_ERR(umem)) { 13498c2ecf20Sopenharmony_ci rv = PTR_ERR(umem); 13508c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "getting user memory failed: %d\n", rv); 13518c2ecf20Sopenharmony_ci umem = NULL; 13528c2ecf20Sopenharmony_ci goto err_out; 13538c2ecf20Sopenharmony_ci } 13548c2ecf20Sopenharmony_ci mr = kzalloc(sizeof(*mr), GFP_KERNEL); 13558c2ecf20Sopenharmony_ci if (!mr) { 13568c2ecf20Sopenharmony_ci rv = -ENOMEM; 13578c2ecf20Sopenharmony_ci goto err_out; 13588c2ecf20Sopenharmony_ci } 13598c2ecf20Sopenharmony_ci rv = siw_mr_add_mem(mr, pd, umem, start, len, rights); 13608c2ecf20Sopenharmony_ci if (rv) 13618c2ecf20Sopenharmony_ci goto err_out; 13628c2ecf20Sopenharmony_ci 13638c2ecf20Sopenharmony_ci if (udata) { 13648c2ecf20Sopenharmony_ci struct siw_uresp_reg_mr uresp = {}; 13658c2ecf20Sopenharmony_ci struct siw_mem *mem = mr->mem; 13668c2ecf20Sopenharmony_ci 13678c2ecf20Sopenharmony_ci if (udata->inlen < sizeof(ureq)) { 13688c2ecf20Sopenharmony_ci rv = -EINVAL; 13698c2ecf20Sopenharmony_ci goto err_out; 13708c2ecf20Sopenharmony_ci } 13718c2ecf20Sopenharmony_ci rv = ib_copy_from_udata(&ureq, udata, sizeof(ureq)); 13728c2ecf20Sopenharmony_ci if (rv) 13738c2ecf20Sopenharmony_ci goto err_out; 13748c2ecf20Sopenharmony_ci 13758c2ecf20Sopenharmony_ci mr->base_mr.lkey |= ureq.stag_key; 13768c2ecf20Sopenharmony_ci mr->base_mr.rkey |= ureq.stag_key; 13778c2ecf20Sopenharmony_ci mem->stag |= ureq.stag_key; 13788c2ecf20Sopenharmony_ci uresp.stag = mem->stag; 13798c2ecf20Sopenharmony_ci 13808c2ecf20Sopenharmony_ci if (udata->outlen < sizeof(uresp)) { 13818c2ecf20Sopenharmony_ci rv = -EINVAL; 13828c2ecf20Sopenharmony_ci goto err_out; 13838c2ecf20Sopenharmony_ci } 13848c2ecf20Sopenharmony_ci rv = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 13858c2ecf20Sopenharmony_ci if (rv) 13868c2ecf20Sopenharmony_ci goto err_out; 13878c2ecf20Sopenharmony_ci } 13888c2ecf20Sopenharmony_ci mr->mem->stag_valid = 1; 13898c2ecf20Sopenharmony_ci 13908c2ecf20Sopenharmony_ci return &mr->base_mr; 13918c2ecf20Sopenharmony_ci 13928c2ecf20Sopenharmony_cierr_out: 13938c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_mr); 13948c2ecf20Sopenharmony_ci if (mr) { 13958c2ecf20Sopenharmony_ci if (mr->mem) 13968c2ecf20Sopenharmony_ci siw_mr_drop_mem(mr); 13978c2ecf20Sopenharmony_ci kfree_rcu(mr, rcu); 13988c2ecf20Sopenharmony_ci } else { 13998c2ecf20Sopenharmony_ci if (umem) 14008c2ecf20Sopenharmony_ci siw_umem_release(umem, false); 14018c2ecf20Sopenharmony_ci } 14028c2ecf20Sopenharmony_ci return ERR_PTR(rv); 14038c2ecf20Sopenharmony_ci} 14048c2ecf20Sopenharmony_ci 14058c2ecf20Sopenharmony_cistruct ib_mr *siw_alloc_mr(struct ib_pd *pd, enum ib_mr_type mr_type, 14068c2ecf20Sopenharmony_ci u32 max_sge) 14078c2ecf20Sopenharmony_ci{ 14088c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(pd->device); 14098c2ecf20Sopenharmony_ci struct siw_mr *mr = NULL; 14108c2ecf20Sopenharmony_ci struct siw_pbl *pbl = NULL; 14118c2ecf20Sopenharmony_ci int rv; 14128c2ecf20Sopenharmony_ci 14138c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_mr) > SIW_MAX_MR) { 14148c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "too many mr's\n"); 14158c2ecf20Sopenharmony_ci rv = -ENOMEM; 14168c2ecf20Sopenharmony_ci goto err_out; 14178c2ecf20Sopenharmony_ci } 14188c2ecf20Sopenharmony_ci if (mr_type != IB_MR_TYPE_MEM_REG) { 14198c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "mr type %d unsupported\n", mr_type); 14208c2ecf20Sopenharmony_ci rv = -EOPNOTSUPP; 14218c2ecf20Sopenharmony_ci goto err_out; 14228c2ecf20Sopenharmony_ci } 14238c2ecf20Sopenharmony_ci if (max_sge > SIW_MAX_SGE_PBL) { 14248c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "too many sge's: %d\n", max_sge); 14258c2ecf20Sopenharmony_ci rv = -ENOMEM; 14268c2ecf20Sopenharmony_ci goto err_out; 14278c2ecf20Sopenharmony_ci } 14288c2ecf20Sopenharmony_ci pbl = siw_pbl_alloc(max_sge); 14298c2ecf20Sopenharmony_ci if (IS_ERR(pbl)) { 14308c2ecf20Sopenharmony_ci rv = PTR_ERR(pbl); 14318c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "pbl allocation failed: %d\n", rv); 14328c2ecf20Sopenharmony_ci pbl = NULL; 14338c2ecf20Sopenharmony_ci goto err_out; 14348c2ecf20Sopenharmony_ci } 14358c2ecf20Sopenharmony_ci mr = kzalloc(sizeof(*mr), GFP_KERNEL); 14368c2ecf20Sopenharmony_ci if (!mr) { 14378c2ecf20Sopenharmony_ci rv = -ENOMEM; 14388c2ecf20Sopenharmony_ci goto err_out; 14398c2ecf20Sopenharmony_ci } 14408c2ecf20Sopenharmony_ci rv = siw_mr_add_mem(mr, pd, pbl, 0, max_sge * PAGE_SIZE, 0); 14418c2ecf20Sopenharmony_ci if (rv) 14428c2ecf20Sopenharmony_ci goto err_out; 14438c2ecf20Sopenharmony_ci 14448c2ecf20Sopenharmony_ci mr->mem->is_pbl = 1; 14458c2ecf20Sopenharmony_ci 14468c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "[MEM %u]: success\n", mr->mem->stag); 14478c2ecf20Sopenharmony_ci 14488c2ecf20Sopenharmony_ci return &mr->base_mr; 14498c2ecf20Sopenharmony_ci 14508c2ecf20Sopenharmony_cierr_out: 14518c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_mr); 14528c2ecf20Sopenharmony_ci 14538c2ecf20Sopenharmony_ci if (!mr) { 14548c2ecf20Sopenharmony_ci kfree(pbl); 14558c2ecf20Sopenharmony_ci } else { 14568c2ecf20Sopenharmony_ci if (mr->mem) 14578c2ecf20Sopenharmony_ci siw_mr_drop_mem(mr); 14588c2ecf20Sopenharmony_ci kfree_rcu(mr, rcu); 14598c2ecf20Sopenharmony_ci } 14608c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "failed: %d\n", rv); 14618c2ecf20Sopenharmony_ci 14628c2ecf20Sopenharmony_ci return ERR_PTR(rv); 14638c2ecf20Sopenharmony_ci} 14648c2ecf20Sopenharmony_ci 14658c2ecf20Sopenharmony_ci/* Just used to count number of pages being mapped */ 14668c2ecf20Sopenharmony_cistatic int siw_set_pbl_page(struct ib_mr *base_mr, u64 buf_addr) 14678c2ecf20Sopenharmony_ci{ 14688c2ecf20Sopenharmony_ci return 0; 14698c2ecf20Sopenharmony_ci} 14708c2ecf20Sopenharmony_ci 14718c2ecf20Sopenharmony_ciint siw_map_mr_sg(struct ib_mr *base_mr, struct scatterlist *sl, int num_sle, 14728c2ecf20Sopenharmony_ci unsigned int *sg_off) 14738c2ecf20Sopenharmony_ci{ 14748c2ecf20Sopenharmony_ci struct scatterlist *slp; 14758c2ecf20Sopenharmony_ci struct siw_mr *mr = to_siw_mr(base_mr); 14768c2ecf20Sopenharmony_ci struct siw_mem *mem = mr->mem; 14778c2ecf20Sopenharmony_ci struct siw_pbl *pbl = mem->pbl; 14788c2ecf20Sopenharmony_ci struct siw_pble *pble; 14798c2ecf20Sopenharmony_ci unsigned long pbl_size; 14808c2ecf20Sopenharmony_ci int i, rv; 14818c2ecf20Sopenharmony_ci 14828c2ecf20Sopenharmony_ci if (!pbl) { 14838c2ecf20Sopenharmony_ci siw_dbg_mem(mem, "no PBL allocated\n"); 14848c2ecf20Sopenharmony_ci return -EINVAL; 14858c2ecf20Sopenharmony_ci } 14868c2ecf20Sopenharmony_ci pble = pbl->pbe; 14878c2ecf20Sopenharmony_ci 14888c2ecf20Sopenharmony_ci if (pbl->max_buf < num_sle) { 14898c2ecf20Sopenharmony_ci siw_dbg_mem(mem, "too many SGE's: %d > %d\n", 14908c2ecf20Sopenharmony_ci num_sle, pbl->max_buf); 14918c2ecf20Sopenharmony_ci return -ENOMEM; 14928c2ecf20Sopenharmony_ci } 14938c2ecf20Sopenharmony_ci for_each_sg(sl, slp, num_sle, i) { 14948c2ecf20Sopenharmony_ci if (sg_dma_len(slp) == 0) { 14958c2ecf20Sopenharmony_ci siw_dbg_mem(mem, "empty SGE\n"); 14968c2ecf20Sopenharmony_ci return -EINVAL; 14978c2ecf20Sopenharmony_ci } 14988c2ecf20Sopenharmony_ci if (i == 0) { 14998c2ecf20Sopenharmony_ci pble->addr = sg_dma_address(slp); 15008c2ecf20Sopenharmony_ci pble->size = sg_dma_len(slp); 15018c2ecf20Sopenharmony_ci pble->pbl_off = 0; 15028c2ecf20Sopenharmony_ci pbl_size = pble->size; 15038c2ecf20Sopenharmony_ci pbl->num_buf = 1; 15048c2ecf20Sopenharmony_ci } else { 15058c2ecf20Sopenharmony_ci /* Merge PBL entries if adjacent */ 15068c2ecf20Sopenharmony_ci if (pble->addr + pble->size == sg_dma_address(slp)) { 15078c2ecf20Sopenharmony_ci pble->size += sg_dma_len(slp); 15088c2ecf20Sopenharmony_ci } else { 15098c2ecf20Sopenharmony_ci pble++; 15108c2ecf20Sopenharmony_ci pbl->num_buf++; 15118c2ecf20Sopenharmony_ci pble->addr = sg_dma_address(slp); 15128c2ecf20Sopenharmony_ci pble->size = sg_dma_len(slp); 15138c2ecf20Sopenharmony_ci pble->pbl_off = pbl_size; 15148c2ecf20Sopenharmony_ci } 15158c2ecf20Sopenharmony_ci pbl_size += sg_dma_len(slp); 15168c2ecf20Sopenharmony_ci } 15178c2ecf20Sopenharmony_ci siw_dbg_mem(mem, 15188c2ecf20Sopenharmony_ci "sge[%d], size %u, addr 0x%p, total %lu\n", 15198c2ecf20Sopenharmony_ci i, pble->size, (void *)(uintptr_t)pble->addr, 15208c2ecf20Sopenharmony_ci pbl_size); 15218c2ecf20Sopenharmony_ci } 15228c2ecf20Sopenharmony_ci rv = ib_sg_to_pages(base_mr, sl, num_sle, sg_off, siw_set_pbl_page); 15238c2ecf20Sopenharmony_ci if (rv > 0) { 15248c2ecf20Sopenharmony_ci mem->len = base_mr->length; 15258c2ecf20Sopenharmony_ci mem->va = base_mr->iova; 15268c2ecf20Sopenharmony_ci siw_dbg_mem(mem, 15278c2ecf20Sopenharmony_ci "%llu bytes, start 0x%pK, %u SLE to %u entries\n", 15288c2ecf20Sopenharmony_ci mem->len, (void *)(uintptr_t)mem->va, num_sle, 15298c2ecf20Sopenharmony_ci pbl->num_buf); 15308c2ecf20Sopenharmony_ci } 15318c2ecf20Sopenharmony_ci return rv; 15328c2ecf20Sopenharmony_ci} 15338c2ecf20Sopenharmony_ci 15348c2ecf20Sopenharmony_ci/* 15358c2ecf20Sopenharmony_ci * siw_get_dma_mr() 15368c2ecf20Sopenharmony_ci * 15378c2ecf20Sopenharmony_ci * Create a (empty) DMA memory region, where no umem is attached. 15388c2ecf20Sopenharmony_ci */ 15398c2ecf20Sopenharmony_cistruct ib_mr *siw_get_dma_mr(struct ib_pd *pd, int rights) 15408c2ecf20Sopenharmony_ci{ 15418c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(pd->device); 15428c2ecf20Sopenharmony_ci struct siw_mr *mr = NULL; 15438c2ecf20Sopenharmony_ci int rv; 15448c2ecf20Sopenharmony_ci 15458c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_mr) > SIW_MAX_MR) { 15468c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "too many mr's\n"); 15478c2ecf20Sopenharmony_ci rv = -ENOMEM; 15488c2ecf20Sopenharmony_ci goto err_out; 15498c2ecf20Sopenharmony_ci } 15508c2ecf20Sopenharmony_ci mr = kzalloc(sizeof(*mr), GFP_KERNEL); 15518c2ecf20Sopenharmony_ci if (!mr) { 15528c2ecf20Sopenharmony_ci rv = -ENOMEM; 15538c2ecf20Sopenharmony_ci goto err_out; 15548c2ecf20Sopenharmony_ci } 15558c2ecf20Sopenharmony_ci rv = siw_mr_add_mem(mr, pd, NULL, 0, ULONG_MAX, rights); 15568c2ecf20Sopenharmony_ci if (rv) 15578c2ecf20Sopenharmony_ci goto err_out; 15588c2ecf20Sopenharmony_ci 15598c2ecf20Sopenharmony_ci mr->mem->stag_valid = 1; 15608c2ecf20Sopenharmony_ci 15618c2ecf20Sopenharmony_ci siw_dbg_pd(pd, "[MEM %u]: success\n", mr->mem->stag); 15628c2ecf20Sopenharmony_ci 15638c2ecf20Sopenharmony_ci return &mr->base_mr; 15648c2ecf20Sopenharmony_ci 15658c2ecf20Sopenharmony_cierr_out: 15668c2ecf20Sopenharmony_ci if (rv) 15678c2ecf20Sopenharmony_ci kfree(mr); 15688c2ecf20Sopenharmony_ci 15698c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_mr); 15708c2ecf20Sopenharmony_ci 15718c2ecf20Sopenharmony_ci return ERR_PTR(rv); 15728c2ecf20Sopenharmony_ci} 15738c2ecf20Sopenharmony_ci 15748c2ecf20Sopenharmony_ci/* 15758c2ecf20Sopenharmony_ci * siw_create_srq() 15768c2ecf20Sopenharmony_ci * 15778c2ecf20Sopenharmony_ci * Create Shared Receive Queue of attributes @init_attrs 15788c2ecf20Sopenharmony_ci * within protection domain given by @pd. 15798c2ecf20Sopenharmony_ci * 15808c2ecf20Sopenharmony_ci * @base_srq: Base SRQ contained in siw SRQ. 15818c2ecf20Sopenharmony_ci * @init_attrs: SRQ init attributes. 15828c2ecf20Sopenharmony_ci * @udata: points to user context 15838c2ecf20Sopenharmony_ci */ 15848c2ecf20Sopenharmony_ciint siw_create_srq(struct ib_srq *base_srq, 15858c2ecf20Sopenharmony_ci struct ib_srq_init_attr *init_attrs, struct ib_udata *udata) 15868c2ecf20Sopenharmony_ci{ 15878c2ecf20Sopenharmony_ci struct siw_srq *srq = to_siw_srq(base_srq); 15888c2ecf20Sopenharmony_ci struct ib_srq_attr *attrs = &init_attrs->attr; 15898c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_srq->device); 15908c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = 15918c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 15928c2ecf20Sopenharmony_ci base_ucontext); 15938c2ecf20Sopenharmony_ci int rv; 15948c2ecf20Sopenharmony_ci 15958c2ecf20Sopenharmony_ci if (atomic_inc_return(&sdev->num_srq) > SIW_MAX_SRQ) { 15968c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, "too many SRQ's\n"); 15978c2ecf20Sopenharmony_ci rv = -ENOMEM; 15988c2ecf20Sopenharmony_ci goto err_out; 15998c2ecf20Sopenharmony_ci } 16008c2ecf20Sopenharmony_ci if (attrs->max_wr == 0 || attrs->max_wr > SIW_MAX_SRQ_WR || 16018c2ecf20Sopenharmony_ci attrs->max_sge > SIW_MAX_SGE || attrs->srq_limit > attrs->max_wr) { 16028c2ecf20Sopenharmony_ci rv = -EINVAL; 16038c2ecf20Sopenharmony_ci goto err_out; 16048c2ecf20Sopenharmony_ci } 16058c2ecf20Sopenharmony_ci srq->max_sge = attrs->max_sge; 16068c2ecf20Sopenharmony_ci srq->num_rqe = roundup_pow_of_two(attrs->max_wr); 16078c2ecf20Sopenharmony_ci srq->limit = attrs->srq_limit; 16088c2ecf20Sopenharmony_ci if (srq->limit) 16098c2ecf20Sopenharmony_ci srq->armed = true; 16108c2ecf20Sopenharmony_ci 16118c2ecf20Sopenharmony_ci srq->is_kernel_res = !udata; 16128c2ecf20Sopenharmony_ci 16138c2ecf20Sopenharmony_ci if (udata) 16148c2ecf20Sopenharmony_ci srq->recvq = 16158c2ecf20Sopenharmony_ci vmalloc_user(srq->num_rqe * sizeof(struct siw_rqe)); 16168c2ecf20Sopenharmony_ci else 16178c2ecf20Sopenharmony_ci srq->recvq = vzalloc(srq->num_rqe * sizeof(struct siw_rqe)); 16188c2ecf20Sopenharmony_ci 16198c2ecf20Sopenharmony_ci if (srq->recvq == NULL) { 16208c2ecf20Sopenharmony_ci rv = -ENOMEM; 16218c2ecf20Sopenharmony_ci goto err_out; 16228c2ecf20Sopenharmony_ci } 16238c2ecf20Sopenharmony_ci if (udata) { 16248c2ecf20Sopenharmony_ci struct siw_uresp_create_srq uresp = {}; 16258c2ecf20Sopenharmony_ci size_t length = srq->num_rqe * sizeof(struct siw_rqe); 16268c2ecf20Sopenharmony_ci 16278c2ecf20Sopenharmony_ci srq->srq_entry = 16288c2ecf20Sopenharmony_ci siw_mmap_entry_insert(ctx, srq->recvq, 16298c2ecf20Sopenharmony_ci length, &uresp.srq_key); 16308c2ecf20Sopenharmony_ci if (!srq->srq_entry) { 16318c2ecf20Sopenharmony_ci rv = -ENOMEM; 16328c2ecf20Sopenharmony_ci goto err_out; 16338c2ecf20Sopenharmony_ci } 16348c2ecf20Sopenharmony_ci 16358c2ecf20Sopenharmony_ci uresp.num_rqe = srq->num_rqe; 16368c2ecf20Sopenharmony_ci 16378c2ecf20Sopenharmony_ci if (udata->outlen < sizeof(uresp)) { 16388c2ecf20Sopenharmony_ci rv = -EINVAL; 16398c2ecf20Sopenharmony_ci goto err_out; 16408c2ecf20Sopenharmony_ci } 16418c2ecf20Sopenharmony_ci rv = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 16428c2ecf20Sopenharmony_ci if (rv) 16438c2ecf20Sopenharmony_ci goto err_out; 16448c2ecf20Sopenharmony_ci } 16458c2ecf20Sopenharmony_ci spin_lock_init(&srq->lock); 16468c2ecf20Sopenharmony_ci 16478c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, "[SRQ]: success\n"); 16488c2ecf20Sopenharmony_ci 16498c2ecf20Sopenharmony_ci return 0; 16508c2ecf20Sopenharmony_ci 16518c2ecf20Sopenharmony_cierr_out: 16528c2ecf20Sopenharmony_ci if (srq->recvq) { 16538c2ecf20Sopenharmony_ci if (ctx) 16548c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(srq->srq_entry); 16558c2ecf20Sopenharmony_ci vfree(srq->recvq); 16568c2ecf20Sopenharmony_ci } 16578c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_srq); 16588c2ecf20Sopenharmony_ci 16598c2ecf20Sopenharmony_ci return rv; 16608c2ecf20Sopenharmony_ci} 16618c2ecf20Sopenharmony_ci 16628c2ecf20Sopenharmony_ci/* 16638c2ecf20Sopenharmony_ci * siw_modify_srq() 16648c2ecf20Sopenharmony_ci * 16658c2ecf20Sopenharmony_ci * Modify SRQ. The caller may resize SRQ and/or set/reset notification 16668c2ecf20Sopenharmony_ci * limit and (re)arm IB_EVENT_SRQ_LIMIT_REACHED notification. 16678c2ecf20Sopenharmony_ci * 16688c2ecf20Sopenharmony_ci * NOTE: it is unclear if RDMA core allows for changing the MAX_SGE 16698c2ecf20Sopenharmony_ci * parameter. siw_modify_srq() does not check the attrs->max_sge param. 16708c2ecf20Sopenharmony_ci */ 16718c2ecf20Sopenharmony_ciint siw_modify_srq(struct ib_srq *base_srq, struct ib_srq_attr *attrs, 16728c2ecf20Sopenharmony_ci enum ib_srq_attr_mask attr_mask, struct ib_udata *udata) 16738c2ecf20Sopenharmony_ci{ 16748c2ecf20Sopenharmony_ci struct siw_srq *srq = to_siw_srq(base_srq); 16758c2ecf20Sopenharmony_ci unsigned long flags; 16768c2ecf20Sopenharmony_ci int rv = 0; 16778c2ecf20Sopenharmony_ci 16788c2ecf20Sopenharmony_ci spin_lock_irqsave(&srq->lock, flags); 16798c2ecf20Sopenharmony_ci 16808c2ecf20Sopenharmony_ci if (attr_mask & IB_SRQ_MAX_WR) { 16818c2ecf20Sopenharmony_ci /* resize request not yet supported */ 16828c2ecf20Sopenharmony_ci rv = -EOPNOTSUPP; 16838c2ecf20Sopenharmony_ci goto out; 16848c2ecf20Sopenharmony_ci } 16858c2ecf20Sopenharmony_ci if (attr_mask & IB_SRQ_LIMIT) { 16868c2ecf20Sopenharmony_ci if (attrs->srq_limit) { 16878c2ecf20Sopenharmony_ci if (unlikely(attrs->srq_limit > srq->num_rqe)) { 16888c2ecf20Sopenharmony_ci rv = -EINVAL; 16898c2ecf20Sopenharmony_ci goto out; 16908c2ecf20Sopenharmony_ci } 16918c2ecf20Sopenharmony_ci srq->armed = true; 16928c2ecf20Sopenharmony_ci } else { 16938c2ecf20Sopenharmony_ci srq->armed = false; 16948c2ecf20Sopenharmony_ci } 16958c2ecf20Sopenharmony_ci srq->limit = attrs->srq_limit; 16968c2ecf20Sopenharmony_ci } 16978c2ecf20Sopenharmony_ciout: 16988c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&srq->lock, flags); 16998c2ecf20Sopenharmony_ci 17008c2ecf20Sopenharmony_ci return rv; 17018c2ecf20Sopenharmony_ci} 17028c2ecf20Sopenharmony_ci 17038c2ecf20Sopenharmony_ci/* 17048c2ecf20Sopenharmony_ci * siw_query_srq() 17058c2ecf20Sopenharmony_ci * 17068c2ecf20Sopenharmony_ci * Query SRQ attributes. 17078c2ecf20Sopenharmony_ci */ 17088c2ecf20Sopenharmony_ciint siw_query_srq(struct ib_srq *base_srq, struct ib_srq_attr *attrs) 17098c2ecf20Sopenharmony_ci{ 17108c2ecf20Sopenharmony_ci struct siw_srq *srq = to_siw_srq(base_srq); 17118c2ecf20Sopenharmony_ci unsigned long flags; 17128c2ecf20Sopenharmony_ci 17138c2ecf20Sopenharmony_ci spin_lock_irqsave(&srq->lock, flags); 17148c2ecf20Sopenharmony_ci 17158c2ecf20Sopenharmony_ci attrs->max_wr = srq->num_rqe; 17168c2ecf20Sopenharmony_ci attrs->max_sge = srq->max_sge; 17178c2ecf20Sopenharmony_ci attrs->srq_limit = srq->limit; 17188c2ecf20Sopenharmony_ci 17198c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&srq->lock, flags); 17208c2ecf20Sopenharmony_ci 17218c2ecf20Sopenharmony_ci return 0; 17228c2ecf20Sopenharmony_ci} 17238c2ecf20Sopenharmony_ci 17248c2ecf20Sopenharmony_ci/* 17258c2ecf20Sopenharmony_ci * siw_destroy_srq() 17268c2ecf20Sopenharmony_ci * 17278c2ecf20Sopenharmony_ci * Destroy SRQ. 17288c2ecf20Sopenharmony_ci * It is assumed that the SRQ is not referenced by any 17298c2ecf20Sopenharmony_ci * QP anymore - the code trusts the RDMA core environment to keep track 17308c2ecf20Sopenharmony_ci * of QP references. 17318c2ecf20Sopenharmony_ci */ 17328c2ecf20Sopenharmony_ciint siw_destroy_srq(struct ib_srq *base_srq, struct ib_udata *udata) 17338c2ecf20Sopenharmony_ci{ 17348c2ecf20Sopenharmony_ci struct siw_srq *srq = to_siw_srq(base_srq); 17358c2ecf20Sopenharmony_ci struct siw_device *sdev = to_siw_dev(base_srq->device); 17368c2ecf20Sopenharmony_ci struct siw_ucontext *ctx = 17378c2ecf20Sopenharmony_ci rdma_udata_to_drv_context(udata, struct siw_ucontext, 17388c2ecf20Sopenharmony_ci base_ucontext); 17398c2ecf20Sopenharmony_ci 17408c2ecf20Sopenharmony_ci if (ctx) 17418c2ecf20Sopenharmony_ci rdma_user_mmap_entry_remove(srq->srq_entry); 17428c2ecf20Sopenharmony_ci vfree(srq->recvq); 17438c2ecf20Sopenharmony_ci atomic_dec(&sdev->num_srq); 17448c2ecf20Sopenharmony_ci return 0; 17458c2ecf20Sopenharmony_ci} 17468c2ecf20Sopenharmony_ci 17478c2ecf20Sopenharmony_ci/* 17488c2ecf20Sopenharmony_ci * siw_post_srq_recv() 17498c2ecf20Sopenharmony_ci * 17508c2ecf20Sopenharmony_ci * Post a list of receive queue elements to SRQ. 17518c2ecf20Sopenharmony_ci * NOTE: The function does not check or lock a certain SRQ state 17528c2ecf20Sopenharmony_ci * during the post operation. The code simply trusts the 17538c2ecf20Sopenharmony_ci * RDMA core environment. 17548c2ecf20Sopenharmony_ci * 17558c2ecf20Sopenharmony_ci * @base_srq: Base SRQ contained in siw SRQ 17568c2ecf20Sopenharmony_ci * @wr: List of R-WR's 17578c2ecf20Sopenharmony_ci * @bad_wr: Updated to failing WR if posting fails. 17588c2ecf20Sopenharmony_ci */ 17598c2ecf20Sopenharmony_ciint siw_post_srq_recv(struct ib_srq *base_srq, const struct ib_recv_wr *wr, 17608c2ecf20Sopenharmony_ci const struct ib_recv_wr **bad_wr) 17618c2ecf20Sopenharmony_ci{ 17628c2ecf20Sopenharmony_ci struct siw_srq *srq = to_siw_srq(base_srq); 17638c2ecf20Sopenharmony_ci unsigned long flags; 17648c2ecf20Sopenharmony_ci int rv = 0; 17658c2ecf20Sopenharmony_ci 17668c2ecf20Sopenharmony_ci if (unlikely(!srq->is_kernel_res)) { 17678c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, 17688c2ecf20Sopenharmony_ci "[SRQ]: no kernel post_recv for mapped srq\n"); 17698c2ecf20Sopenharmony_ci rv = -EINVAL; 17708c2ecf20Sopenharmony_ci goto out; 17718c2ecf20Sopenharmony_ci } 17728c2ecf20Sopenharmony_ci /* 17738c2ecf20Sopenharmony_ci * Serialize potentially multiple producers. 17748c2ecf20Sopenharmony_ci * Also needed to serialize potentially multiple 17758c2ecf20Sopenharmony_ci * consumers. 17768c2ecf20Sopenharmony_ci */ 17778c2ecf20Sopenharmony_ci spin_lock_irqsave(&srq->lock, flags); 17788c2ecf20Sopenharmony_ci 17798c2ecf20Sopenharmony_ci while (wr) { 17808c2ecf20Sopenharmony_ci u32 idx = srq->rq_put % srq->num_rqe; 17818c2ecf20Sopenharmony_ci struct siw_rqe *rqe = &srq->recvq[idx]; 17828c2ecf20Sopenharmony_ci 17838c2ecf20Sopenharmony_ci if (rqe->flags) { 17848c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, "SRQ full\n"); 17858c2ecf20Sopenharmony_ci rv = -ENOMEM; 17868c2ecf20Sopenharmony_ci break; 17878c2ecf20Sopenharmony_ci } 17888c2ecf20Sopenharmony_ci if (unlikely(wr->num_sge > srq->max_sge)) { 17898c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, 17908c2ecf20Sopenharmony_ci "[SRQ]: too many sge's: %d\n", wr->num_sge); 17918c2ecf20Sopenharmony_ci rv = -EINVAL; 17928c2ecf20Sopenharmony_ci break; 17938c2ecf20Sopenharmony_ci } 17948c2ecf20Sopenharmony_ci rqe->id = wr->wr_id; 17958c2ecf20Sopenharmony_ci rqe->num_sge = wr->num_sge; 17968c2ecf20Sopenharmony_ci siw_copy_sgl(wr->sg_list, rqe->sge, wr->num_sge); 17978c2ecf20Sopenharmony_ci 17988c2ecf20Sopenharmony_ci /* Make sure S-RQE is completely written before valid */ 17998c2ecf20Sopenharmony_ci smp_wmb(); 18008c2ecf20Sopenharmony_ci 18018c2ecf20Sopenharmony_ci rqe->flags = SIW_WQE_VALID; 18028c2ecf20Sopenharmony_ci 18038c2ecf20Sopenharmony_ci srq->rq_put++; 18048c2ecf20Sopenharmony_ci wr = wr->next; 18058c2ecf20Sopenharmony_ci } 18068c2ecf20Sopenharmony_ci spin_unlock_irqrestore(&srq->lock, flags); 18078c2ecf20Sopenharmony_ciout: 18088c2ecf20Sopenharmony_ci if (unlikely(rv < 0)) { 18098c2ecf20Sopenharmony_ci siw_dbg_pd(base_srq->pd, "[SRQ]: error %d\n", rv); 18108c2ecf20Sopenharmony_ci *bad_wr = wr; 18118c2ecf20Sopenharmony_ci } 18128c2ecf20Sopenharmony_ci return rv; 18138c2ecf20Sopenharmony_ci} 18148c2ecf20Sopenharmony_ci 18158c2ecf20Sopenharmony_civoid siw_qp_event(struct siw_qp *qp, enum ib_event_type etype) 18168c2ecf20Sopenharmony_ci{ 18178c2ecf20Sopenharmony_ci struct ib_event event; 18188c2ecf20Sopenharmony_ci struct ib_qp *base_qp = &qp->base_qp; 18198c2ecf20Sopenharmony_ci 18208c2ecf20Sopenharmony_ci /* 18218c2ecf20Sopenharmony_ci * Do not report asynchronous errors on QP which gets 18228c2ecf20Sopenharmony_ci * destroyed via verbs interface (siw_destroy_qp()) 18238c2ecf20Sopenharmony_ci */ 18248c2ecf20Sopenharmony_ci if (qp->attrs.flags & SIW_QP_IN_DESTROY) 18258c2ecf20Sopenharmony_ci return; 18268c2ecf20Sopenharmony_ci 18278c2ecf20Sopenharmony_ci event.event = etype; 18288c2ecf20Sopenharmony_ci event.device = base_qp->device; 18298c2ecf20Sopenharmony_ci event.element.qp = base_qp; 18308c2ecf20Sopenharmony_ci 18318c2ecf20Sopenharmony_ci if (base_qp->event_handler) { 18328c2ecf20Sopenharmony_ci siw_dbg_qp(qp, "reporting event %d\n", etype); 18338c2ecf20Sopenharmony_ci base_qp->event_handler(&event, base_qp->qp_context); 18348c2ecf20Sopenharmony_ci } 18358c2ecf20Sopenharmony_ci} 18368c2ecf20Sopenharmony_ci 18378c2ecf20Sopenharmony_civoid siw_cq_event(struct siw_cq *cq, enum ib_event_type etype) 18388c2ecf20Sopenharmony_ci{ 18398c2ecf20Sopenharmony_ci struct ib_event event; 18408c2ecf20Sopenharmony_ci struct ib_cq *base_cq = &cq->base_cq; 18418c2ecf20Sopenharmony_ci 18428c2ecf20Sopenharmony_ci event.event = etype; 18438c2ecf20Sopenharmony_ci event.device = base_cq->device; 18448c2ecf20Sopenharmony_ci event.element.cq = base_cq; 18458c2ecf20Sopenharmony_ci 18468c2ecf20Sopenharmony_ci if (base_cq->event_handler) { 18478c2ecf20Sopenharmony_ci siw_dbg_cq(cq, "reporting CQ event %d\n", etype); 18488c2ecf20Sopenharmony_ci base_cq->event_handler(&event, base_cq->cq_context); 18498c2ecf20Sopenharmony_ci } 18508c2ecf20Sopenharmony_ci} 18518c2ecf20Sopenharmony_ci 18528c2ecf20Sopenharmony_civoid siw_srq_event(struct siw_srq *srq, enum ib_event_type etype) 18538c2ecf20Sopenharmony_ci{ 18548c2ecf20Sopenharmony_ci struct ib_event event; 18558c2ecf20Sopenharmony_ci struct ib_srq *base_srq = &srq->base_srq; 18568c2ecf20Sopenharmony_ci 18578c2ecf20Sopenharmony_ci event.event = etype; 18588c2ecf20Sopenharmony_ci event.device = base_srq->device; 18598c2ecf20Sopenharmony_ci event.element.srq = base_srq; 18608c2ecf20Sopenharmony_ci 18618c2ecf20Sopenharmony_ci if (base_srq->event_handler) { 18628c2ecf20Sopenharmony_ci siw_dbg_pd(srq->base_srq.pd, 18638c2ecf20Sopenharmony_ci "reporting SRQ event %d\n", etype); 18648c2ecf20Sopenharmony_ci base_srq->event_handler(&event, base_srq->srq_context); 18658c2ecf20Sopenharmony_ci } 18668c2ecf20Sopenharmony_ci} 18678c2ecf20Sopenharmony_ci 18688c2ecf20Sopenharmony_civoid siw_port_event(struct siw_device *sdev, u8 port, enum ib_event_type etype) 18698c2ecf20Sopenharmony_ci{ 18708c2ecf20Sopenharmony_ci struct ib_event event; 18718c2ecf20Sopenharmony_ci 18728c2ecf20Sopenharmony_ci event.event = etype; 18738c2ecf20Sopenharmony_ci event.device = &sdev->base_dev; 18748c2ecf20Sopenharmony_ci event.element.port_num = port; 18758c2ecf20Sopenharmony_ci 18768c2ecf20Sopenharmony_ci siw_dbg(&sdev->base_dev, "reporting port event %d\n", etype); 18778c2ecf20Sopenharmony_ci 18788c2ecf20Sopenharmony_ci ib_dispatch_event(&event); 18798c2ecf20Sopenharmony_ci} 1880