162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright (c) 2007, 2008, 2009 QLogic Corporation. All rights reserved. 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * This software is available to you under a choice of one of two 562306a36Sopenharmony_ci * licenses. You may choose to be licensed under the terms of the GNU 662306a36Sopenharmony_ci * General Public License (GPL) Version 2, available from the file 762306a36Sopenharmony_ci * COPYING in the main directory of this source tree, or the 862306a36Sopenharmony_ci * OpenIB.org BSD license below: 962306a36Sopenharmony_ci * 1062306a36Sopenharmony_ci * Redistribution and use in source and binary forms, with or 1162306a36Sopenharmony_ci * without modification, are permitted provided that the following 1262306a36Sopenharmony_ci * conditions are met: 1362306a36Sopenharmony_ci * 1462306a36Sopenharmony_ci * - Redistributions of source code must retain the above 1562306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 1662306a36Sopenharmony_ci * disclaimer. 1762306a36Sopenharmony_ci * 1862306a36Sopenharmony_ci * - Redistributions in binary form must reproduce the above 1962306a36Sopenharmony_ci * copyright notice, this list of conditions and the following 2062306a36Sopenharmony_ci * disclaimer in the documentation and/or other materials 2162306a36Sopenharmony_ci * provided with the distribution. 2262306a36Sopenharmony_ci * 2362306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 2462306a36Sopenharmony_ci * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 2562306a36Sopenharmony_ci * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 2662306a36Sopenharmony_ci * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 2762306a36Sopenharmony_ci * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 2862306a36Sopenharmony_ci * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 2962306a36Sopenharmony_ci * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 3062306a36Sopenharmony_ci * SOFTWARE. 3162306a36Sopenharmony_ci */ 3262306a36Sopenharmony_ci#include <linux/mm.h> 3362306a36Sopenharmony_ci#include <linux/types.h> 3462306a36Sopenharmony_ci#include <linux/device.h> 3562306a36Sopenharmony_ci#include <linux/dmapool.h> 3662306a36Sopenharmony_ci#include <linux/slab.h> 3762306a36Sopenharmony_ci#include <linux/list.h> 3862306a36Sopenharmony_ci#include <linux/highmem.h> 3962306a36Sopenharmony_ci#include <linux/io.h> 4062306a36Sopenharmony_ci#include <linux/uio.h> 4162306a36Sopenharmony_ci#include <linux/rbtree.h> 4262306a36Sopenharmony_ci#include <linux/spinlock.h> 4362306a36Sopenharmony_ci#include <linux/delay.h> 4462306a36Sopenharmony_ci 4562306a36Sopenharmony_ci#include "qib.h" 4662306a36Sopenharmony_ci#include "qib_user_sdma.h" 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci/* minimum size of header */ 4962306a36Sopenharmony_ci#define QIB_USER_SDMA_MIN_HEADER_LENGTH 64 5062306a36Sopenharmony_ci/* expected size of headers (for dma_pool) */ 5162306a36Sopenharmony_ci#define QIB_USER_SDMA_EXP_HEADER_LENGTH 64 5262306a36Sopenharmony_ci/* attempt to drain the queue for 5secs */ 5362306a36Sopenharmony_ci#define QIB_USER_SDMA_DRAIN_TIMEOUT 250 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci/* 5662306a36Sopenharmony_ci * track how many times a process open this driver. 5762306a36Sopenharmony_ci */ 5862306a36Sopenharmony_cistatic struct rb_root qib_user_sdma_rb_root = RB_ROOT; 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_cistruct qib_user_sdma_rb_node { 6162306a36Sopenharmony_ci struct rb_node node; 6262306a36Sopenharmony_ci int refcount; 6362306a36Sopenharmony_ci pid_t pid; 6462306a36Sopenharmony_ci}; 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_cistruct qib_user_sdma_pkt { 6762306a36Sopenharmony_ci struct list_head list; /* list element */ 6862306a36Sopenharmony_ci 6962306a36Sopenharmony_ci u8 tiddma; /* if this is NEW tid-sdma */ 7062306a36Sopenharmony_ci u8 largepkt; /* this is large pkt from kmalloc */ 7162306a36Sopenharmony_ci u16 frag_size; /* frag size used by PSM */ 7262306a36Sopenharmony_ci u16 index; /* last header index or push index */ 7362306a36Sopenharmony_ci u16 naddr; /* dimension of addr (1..3) ... */ 7462306a36Sopenharmony_ci u16 addrlimit; /* addr array size */ 7562306a36Sopenharmony_ci u16 tidsmidx; /* current tidsm index */ 7662306a36Sopenharmony_ci u16 tidsmcount; /* tidsm array item count */ 7762306a36Sopenharmony_ci u16 payload_size; /* payload size so far for header */ 7862306a36Sopenharmony_ci u32 bytes_togo; /* bytes for processing */ 7962306a36Sopenharmony_ci u32 counter; /* sdma pkts queued counter for this entry */ 8062306a36Sopenharmony_ci struct qib_tid_session_member *tidsm; /* tid session member array */ 8162306a36Sopenharmony_ci struct qib_user_sdma_queue *pq; /* which pq this pkt belongs to */ 8262306a36Sopenharmony_ci u64 added; /* global descq number of entries */ 8362306a36Sopenharmony_ci 8462306a36Sopenharmony_ci struct { 8562306a36Sopenharmony_ci u16 offset; /* offset for kvaddr, addr */ 8662306a36Sopenharmony_ci u16 length; /* length in page */ 8762306a36Sopenharmony_ci u16 first_desc; /* first desc */ 8862306a36Sopenharmony_ci u16 last_desc; /* last desc */ 8962306a36Sopenharmony_ci u16 put_page; /* should we put_page? */ 9062306a36Sopenharmony_ci u16 dma_mapped; /* is page dma_mapped? */ 9162306a36Sopenharmony_ci u16 dma_length; /* for dma_unmap_page() */ 9262306a36Sopenharmony_ci u16 padding; 9362306a36Sopenharmony_ci struct page *page; /* may be NULL (coherent mem) */ 9462306a36Sopenharmony_ci void *kvaddr; /* FIXME: only for pio hack */ 9562306a36Sopenharmony_ci dma_addr_t addr; 9662306a36Sopenharmony_ci } addr[4]; /* max pages, any more and we coalesce */ 9762306a36Sopenharmony_ci}; 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_cistruct qib_user_sdma_queue { 10062306a36Sopenharmony_ci /* 10162306a36Sopenharmony_ci * pkts sent to dma engine are queued on this 10262306a36Sopenharmony_ci * list head. the type of the elements of this 10362306a36Sopenharmony_ci * list are struct qib_user_sdma_pkt... 10462306a36Sopenharmony_ci */ 10562306a36Sopenharmony_ci struct list_head sent; 10662306a36Sopenharmony_ci 10762306a36Sopenharmony_ci /* 10862306a36Sopenharmony_ci * Because above list will be accessed by both process and 10962306a36Sopenharmony_ci * signal handler, we need a spinlock for it. 11062306a36Sopenharmony_ci */ 11162306a36Sopenharmony_ci spinlock_t sent_lock ____cacheline_aligned_in_smp; 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_ci /* headers with expected length are allocated from here... */ 11462306a36Sopenharmony_ci char header_cache_name[64]; 11562306a36Sopenharmony_ci struct dma_pool *header_cache; 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_ci /* packets are allocated from the slab cache... */ 11862306a36Sopenharmony_ci char pkt_slab_name[64]; 11962306a36Sopenharmony_ci struct kmem_cache *pkt_slab; 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_ci /* as packets go on the queued queue, they are counted... */ 12262306a36Sopenharmony_ci u32 counter; 12362306a36Sopenharmony_ci u32 sent_counter; 12462306a36Sopenharmony_ci /* pending packets, not sending yet */ 12562306a36Sopenharmony_ci u32 num_pending; 12662306a36Sopenharmony_ci /* sending packets, not complete yet */ 12762306a36Sopenharmony_ci u32 num_sending; 12862306a36Sopenharmony_ci /* global descq number of entry of last sending packet */ 12962306a36Sopenharmony_ci u64 added; 13062306a36Sopenharmony_ci 13162306a36Sopenharmony_ci /* dma page table */ 13262306a36Sopenharmony_ci struct rb_root dma_pages_root; 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_ci struct qib_user_sdma_rb_node *sdma_rb_node; 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci /* protect everything above... */ 13762306a36Sopenharmony_ci struct mutex lock; 13862306a36Sopenharmony_ci}; 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_cistatic struct qib_user_sdma_rb_node * 14162306a36Sopenharmony_ciqib_user_sdma_rb_search(struct rb_root *root, pid_t pid) 14262306a36Sopenharmony_ci{ 14362306a36Sopenharmony_ci struct qib_user_sdma_rb_node *sdma_rb_node; 14462306a36Sopenharmony_ci struct rb_node *node = root->rb_node; 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci while (node) { 14762306a36Sopenharmony_ci sdma_rb_node = rb_entry(node, struct qib_user_sdma_rb_node, 14862306a36Sopenharmony_ci node); 14962306a36Sopenharmony_ci if (pid < sdma_rb_node->pid) 15062306a36Sopenharmony_ci node = node->rb_left; 15162306a36Sopenharmony_ci else if (pid > sdma_rb_node->pid) 15262306a36Sopenharmony_ci node = node->rb_right; 15362306a36Sopenharmony_ci else 15462306a36Sopenharmony_ci return sdma_rb_node; 15562306a36Sopenharmony_ci } 15662306a36Sopenharmony_ci return NULL; 15762306a36Sopenharmony_ci} 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_cistatic int 16062306a36Sopenharmony_ciqib_user_sdma_rb_insert(struct rb_root *root, struct qib_user_sdma_rb_node *new) 16162306a36Sopenharmony_ci{ 16262306a36Sopenharmony_ci struct rb_node **node = &(root->rb_node); 16362306a36Sopenharmony_ci struct rb_node *parent = NULL; 16462306a36Sopenharmony_ci struct qib_user_sdma_rb_node *got; 16562306a36Sopenharmony_ci 16662306a36Sopenharmony_ci while (*node) { 16762306a36Sopenharmony_ci got = rb_entry(*node, struct qib_user_sdma_rb_node, node); 16862306a36Sopenharmony_ci parent = *node; 16962306a36Sopenharmony_ci if (new->pid < got->pid) 17062306a36Sopenharmony_ci node = &((*node)->rb_left); 17162306a36Sopenharmony_ci else if (new->pid > got->pid) 17262306a36Sopenharmony_ci node = &((*node)->rb_right); 17362306a36Sopenharmony_ci else 17462306a36Sopenharmony_ci return 0; 17562306a36Sopenharmony_ci } 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci rb_link_node(&new->node, parent, node); 17862306a36Sopenharmony_ci rb_insert_color(&new->node, root); 17962306a36Sopenharmony_ci return 1; 18062306a36Sopenharmony_ci} 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_cistruct qib_user_sdma_queue * 18362306a36Sopenharmony_ciqib_user_sdma_queue_create(struct device *dev, int unit, int ctxt, int sctxt) 18462306a36Sopenharmony_ci{ 18562306a36Sopenharmony_ci struct qib_user_sdma_queue *pq = 18662306a36Sopenharmony_ci kmalloc(sizeof(struct qib_user_sdma_queue), GFP_KERNEL); 18762306a36Sopenharmony_ci struct qib_user_sdma_rb_node *sdma_rb_node; 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci if (!pq) 19062306a36Sopenharmony_ci goto done; 19162306a36Sopenharmony_ci 19262306a36Sopenharmony_ci pq->counter = 0; 19362306a36Sopenharmony_ci pq->sent_counter = 0; 19462306a36Sopenharmony_ci pq->num_pending = 0; 19562306a36Sopenharmony_ci pq->num_sending = 0; 19662306a36Sopenharmony_ci pq->added = 0; 19762306a36Sopenharmony_ci pq->sdma_rb_node = NULL; 19862306a36Sopenharmony_ci 19962306a36Sopenharmony_ci INIT_LIST_HEAD(&pq->sent); 20062306a36Sopenharmony_ci spin_lock_init(&pq->sent_lock); 20162306a36Sopenharmony_ci mutex_init(&pq->lock); 20262306a36Sopenharmony_ci 20362306a36Sopenharmony_ci snprintf(pq->pkt_slab_name, sizeof(pq->pkt_slab_name), 20462306a36Sopenharmony_ci "qib-user-sdma-pkts-%u-%02u.%02u", unit, ctxt, sctxt); 20562306a36Sopenharmony_ci pq->pkt_slab = kmem_cache_create(pq->pkt_slab_name, 20662306a36Sopenharmony_ci sizeof(struct qib_user_sdma_pkt), 20762306a36Sopenharmony_ci 0, 0, NULL); 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_ci if (!pq->pkt_slab) 21062306a36Sopenharmony_ci goto err_kfree; 21162306a36Sopenharmony_ci 21262306a36Sopenharmony_ci snprintf(pq->header_cache_name, sizeof(pq->header_cache_name), 21362306a36Sopenharmony_ci "qib-user-sdma-headers-%u-%02u.%02u", unit, ctxt, sctxt); 21462306a36Sopenharmony_ci pq->header_cache = dma_pool_create(pq->header_cache_name, 21562306a36Sopenharmony_ci dev, 21662306a36Sopenharmony_ci QIB_USER_SDMA_EXP_HEADER_LENGTH, 21762306a36Sopenharmony_ci 4, 0); 21862306a36Sopenharmony_ci if (!pq->header_cache) 21962306a36Sopenharmony_ci goto err_slab; 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci pq->dma_pages_root = RB_ROOT; 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci sdma_rb_node = qib_user_sdma_rb_search(&qib_user_sdma_rb_root, 22462306a36Sopenharmony_ci current->pid); 22562306a36Sopenharmony_ci if (sdma_rb_node) { 22662306a36Sopenharmony_ci sdma_rb_node->refcount++; 22762306a36Sopenharmony_ci } else { 22862306a36Sopenharmony_ci sdma_rb_node = kmalloc(sizeof( 22962306a36Sopenharmony_ci struct qib_user_sdma_rb_node), GFP_KERNEL); 23062306a36Sopenharmony_ci if (!sdma_rb_node) 23162306a36Sopenharmony_ci goto err_rb; 23262306a36Sopenharmony_ci 23362306a36Sopenharmony_ci sdma_rb_node->refcount = 1; 23462306a36Sopenharmony_ci sdma_rb_node->pid = current->pid; 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci qib_user_sdma_rb_insert(&qib_user_sdma_rb_root, sdma_rb_node); 23762306a36Sopenharmony_ci } 23862306a36Sopenharmony_ci pq->sdma_rb_node = sdma_rb_node; 23962306a36Sopenharmony_ci 24062306a36Sopenharmony_ci goto done; 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_cierr_rb: 24362306a36Sopenharmony_ci dma_pool_destroy(pq->header_cache); 24462306a36Sopenharmony_cierr_slab: 24562306a36Sopenharmony_ci kmem_cache_destroy(pq->pkt_slab); 24662306a36Sopenharmony_cierr_kfree: 24762306a36Sopenharmony_ci kfree(pq); 24862306a36Sopenharmony_ci pq = NULL; 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_cidone: 25162306a36Sopenharmony_ci return pq; 25262306a36Sopenharmony_ci} 25362306a36Sopenharmony_ci 25462306a36Sopenharmony_cistatic void qib_user_sdma_init_frag(struct qib_user_sdma_pkt *pkt, 25562306a36Sopenharmony_ci int i, u16 offset, u16 len, 25662306a36Sopenharmony_ci u16 first_desc, u16 last_desc, 25762306a36Sopenharmony_ci u16 put_page, u16 dma_mapped, 25862306a36Sopenharmony_ci struct page *page, void *kvaddr, 25962306a36Sopenharmony_ci dma_addr_t dma_addr, u16 dma_length) 26062306a36Sopenharmony_ci{ 26162306a36Sopenharmony_ci pkt->addr[i].offset = offset; 26262306a36Sopenharmony_ci pkt->addr[i].length = len; 26362306a36Sopenharmony_ci pkt->addr[i].first_desc = first_desc; 26462306a36Sopenharmony_ci pkt->addr[i].last_desc = last_desc; 26562306a36Sopenharmony_ci pkt->addr[i].put_page = put_page; 26662306a36Sopenharmony_ci pkt->addr[i].dma_mapped = dma_mapped; 26762306a36Sopenharmony_ci pkt->addr[i].page = page; 26862306a36Sopenharmony_ci pkt->addr[i].kvaddr = kvaddr; 26962306a36Sopenharmony_ci pkt->addr[i].addr = dma_addr; 27062306a36Sopenharmony_ci pkt->addr[i].dma_length = dma_length; 27162306a36Sopenharmony_ci} 27262306a36Sopenharmony_ci 27362306a36Sopenharmony_cistatic void *qib_user_sdma_alloc_header(struct qib_user_sdma_queue *pq, 27462306a36Sopenharmony_ci size_t len, dma_addr_t *dma_addr) 27562306a36Sopenharmony_ci{ 27662306a36Sopenharmony_ci void *hdr; 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci if (len == QIB_USER_SDMA_EXP_HEADER_LENGTH) 27962306a36Sopenharmony_ci hdr = dma_pool_alloc(pq->header_cache, GFP_KERNEL, 28062306a36Sopenharmony_ci dma_addr); 28162306a36Sopenharmony_ci else 28262306a36Sopenharmony_ci hdr = NULL; 28362306a36Sopenharmony_ci 28462306a36Sopenharmony_ci if (!hdr) { 28562306a36Sopenharmony_ci hdr = kmalloc(len, GFP_KERNEL); 28662306a36Sopenharmony_ci if (!hdr) 28762306a36Sopenharmony_ci return NULL; 28862306a36Sopenharmony_ci 28962306a36Sopenharmony_ci *dma_addr = 0; 29062306a36Sopenharmony_ci } 29162306a36Sopenharmony_ci 29262306a36Sopenharmony_ci return hdr; 29362306a36Sopenharmony_ci} 29462306a36Sopenharmony_ci 29562306a36Sopenharmony_cistatic int qib_user_sdma_page_to_frags(const struct qib_devdata *dd, 29662306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 29762306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 29862306a36Sopenharmony_ci struct page *page, u16 put, 29962306a36Sopenharmony_ci u16 offset, u16 len, void *kvaddr) 30062306a36Sopenharmony_ci{ 30162306a36Sopenharmony_ci __le16 *pbc16; 30262306a36Sopenharmony_ci void *pbcvaddr; 30362306a36Sopenharmony_ci struct qib_message_header *hdr; 30462306a36Sopenharmony_ci u16 newlen, pbclen, lastdesc, dma_mapped; 30562306a36Sopenharmony_ci u32 vcto; 30662306a36Sopenharmony_ci union qib_seqnum seqnum; 30762306a36Sopenharmony_ci dma_addr_t pbcdaddr; 30862306a36Sopenharmony_ci dma_addr_t dma_addr = 30962306a36Sopenharmony_ci dma_map_page(&dd->pcidev->dev, 31062306a36Sopenharmony_ci page, offset, len, DMA_TO_DEVICE); 31162306a36Sopenharmony_ci int ret = 0; 31262306a36Sopenharmony_ci 31362306a36Sopenharmony_ci if (dma_mapping_error(&dd->pcidev->dev, dma_addr)) { 31462306a36Sopenharmony_ci /* 31562306a36Sopenharmony_ci * dma mapping error, pkt has not managed 31662306a36Sopenharmony_ci * this page yet, return the page here so 31762306a36Sopenharmony_ci * the caller can ignore this page. 31862306a36Sopenharmony_ci */ 31962306a36Sopenharmony_ci if (put) { 32062306a36Sopenharmony_ci unpin_user_page(page); 32162306a36Sopenharmony_ci } else { 32262306a36Sopenharmony_ci /* coalesce case */ 32362306a36Sopenharmony_ci __free_page(page); 32462306a36Sopenharmony_ci } 32562306a36Sopenharmony_ci ret = -ENOMEM; 32662306a36Sopenharmony_ci goto done; 32762306a36Sopenharmony_ci } 32862306a36Sopenharmony_ci offset = 0; 32962306a36Sopenharmony_ci dma_mapped = 1; 33062306a36Sopenharmony_ci 33162306a36Sopenharmony_ci 33262306a36Sopenharmony_cinext_fragment: 33362306a36Sopenharmony_ci 33462306a36Sopenharmony_ci /* 33562306a36Sopenharmony_ci * In tid-sdma, the transfer length is restricted by 33662306a36Sopenharmony_ci * receiver side current tid page length. 33762306a36Sopenharmony_ci */ 33862306a36Sopenharmony_ci if (pkt->tiddma && len > pkt->tidsm[pkt->tidsmidx].length) 33962306a36Sopenharmony_ci newlen = pkt->tidsm[pkt->tidsmidx].length; 34062306a36Sopenharmony_ci else 34162306a36Sopenharmony_ci newlen = len; 34262306a36Sopenharmony_ci 34362306a36Sopenharmony_ci /* 34462306a36Sopenharmony_ci * Then the transfer length is restricted by MTU. 34562306a36Sopenharmony_ci * the last descriptor flag is determined by: 34662306a36Sopenharmony_ci * 1. the current packet is at frag size length. 34762306a36Sopenharmony_ci * 2. the current tid page is done if tid-sdma. 34862306a36Sopenharmony_ci * 3. there is no more byte togo if sdma. 34962306a36Sopenharmony_ci */ 35062306a36Sopenharmony_ci lastdesc = 0; 35162306a36Sopenharmony_ci if ((pkt->payload_size + newlen) >= pkt->frag_size) { 35262306a36Sopenharmony_ci newlen = pkt->frag_size - pkt->payload_size; 35362306a36Sopenharmony_ci lastdesc = 1; 35462306a36Sopenharmony_ci } else if (pkt->tiddma) { 35562306a36Sopenharmony_ci if (newlen == pkt->tidsm[pkt->tidsmidx].length) 35662306a36Sopenharmony_ci lastdesc = 1; 35762306a36Sopenharmony_ci } else { 35862306a36Sopenharmony_ci if (newlen == pkt->bytes_togo) 35962306a36Sopenharmony_ci lastdesc = 1; 36062306a36Sopenharmony_ci } 36162306a36Sopenharmony_ci 36262306a36Sopenharmony_ci /* fill the next fragment in this page */ 36362306a36Sopenharmony_ci qib_user_sdma_init_frag(pkt, pkt->naddr, /* index */ 36462306a36Sopenharmony_ci offset, newlen, /* offset, len */ 36562306a36Sopenharmony_ci 0, lastdesc, /* first last desc */ 36662306a36Sopenharmony_ci put, dma_mapped, /* put page, dma mapped */ 36762306a36Sopenharmony_ci page, kvaddr, /* struct page, virt addr */ 36862306a36Sopenharmony_ci dma_addr, len); /* dma addr, dma length */ 36962306a36Sopenharmony_ci pkt->bytes_togo -= newlen; 37062306a36Sopenharmony_ci pkt->payload_size += newlen; 37162306a36Sopenharmony_ci pkt->naddr++; 37262306a36Sopenharmony_ci if (pkt->naddr == pkt->addrlimit) { 37362306a36Sopenharmony_ci ret = -EFAULT; 37462306a36Sopenharmony_ci goto done; 37562306a36Sopenharmony_ci } 37662306a36Sopenharmony_ci 37762306a36Sopenharmony_ci /* If there is no more byte togo. (lastdesc==1) */ 37862306a36Sopenharmony_ci if (pkt->bytes_togo == 0) { 37962306a36Sopenharmony_ci /* The packet is done, header is not dma mapped yet. 38062306a36Sopenharmony_ci * it should be from kmalloc */ 38162306a36Sopenharmony_ci if (!pkt->addr[pkt->index].addr) { 38262306a36Sopenharmony_ci pkt->addr[pkt->index].addr = 38362306a36Sopenharmony_ci dma_map_single(&dd->pcidev->dev, 38462306a36Sopenharmony_ci pkt->addr[pkt->index].kvaddr, 38562306a36Sopenharmony_ci pkt->addr[pkt->index].dma_length, 38662306a36Sopenharmony_ci DMA_TO_DEVICE); 38762306a36Sopenharmony_ci if (dma_mapping_error(&dd->pcidev->dev, 38862306a36Sopenharmony_ci pkt->addr[pkt->index].addr)) { 38962306a36Sopenharmony_ci ret = -ENOMEM; 39062306a36Sopenharmony_ci goto done; 39162306a36Sopenharmony_ci } 39262306a36Sopenharmony_ci pkt->addr[pkt->index].dma_mapped = 1; 39362306a36Sopenharmony_ci } 39462306a36Sopenharmony_ci 39562306a36Sopenharmony_ci goto done; 39662306a36Sopenharmony_ci } 39762306a36Sopenharmony_ci 39862306a36Sopenharmony_ci /* If tid-sdma, advance tid info. */ 39962306a36Sopenharmony_ci if (pkt->tiddma) { 40062306a36Sopenharmony_ci pkt->tidsm[pkt->tidsmidx].length -= newlen; 40162306a36Sopenharmony_ci if (pkt->tidsm[pkt->tidsmidx].length) { 40262306a36Sopenharmony_ci pkt->tidsm[pkt->tidsmidx].offset += newlen; 40362306a36Sopenharmony_ci } else { 40462306a36Sopenharmony_ci pkt->tidsmidx++; 40562306a36Sopenharmony_ci if (pkt->tidsmidx == pkt->tidsmcount) { 40662306a36Sopenharmony_ci ret = -EFAULT; 40762306a36Sopenharmony_ci goto done; 40862306a36Sopenharmony_ci } 40962306a36Sopenharmony_ci } 41062306a36Sopenharmony_ci } 41162306a36Sopenharmony_ci 41262306a36Sopenharmony_ci /* 41362306a36Sopenharmony_ci * If this is NOT the last descriptor. (newlen==len) 41462306a36Sopenharmony_ci * the current packet is not done yet, but the current 41562306a36Sopenharmony_ci * send side page is done. 41662306a36Sopenharmony_ci */ 41762306a36Sopenharmony_ci if (lastdesc == 0) 41862306a36Sopenharmony_ci goto done; 41962306a36Sopenharmony_ci 42062306a36Sopenharmony_ci /* 42162306a36Sopenharmony_ci * If running this driver under PSM with message size 42262306a36Sopenharmony_ci * fitting into one transfer unit, it is not possible 42362306a36Sopenharmony_ci * to pass this line. otherwise, it is a buggggg. 42462306a36Sopenharmony_ci */ 42562306a36Sopenharmony_ci 42662306a36Sopenharmony_ci /* 42762306a36Sopenharmony_ci * Since the current packet is done, and there are more 42862306a36Sopenharmony_ci * bytes togo, we need to create a new sdma header, copying 42962306a36Sopenharmony_ci * from previous sdma header and modify both. 43062306a36Sopenharmony_ci */ 43162306a36Sopenharmony_ci pbclen = pkt->addr[pkt->index].length; 43262306a36Sopenharmony_ci pbcvaddr = qib_user_sdma_alloc_header(pq, pbclen, &pbcdaddr); 43362306a36Sopenharmony_ci if (!pbcvaddr) { 43462306a36Sopenharmony_ci ret = -ENOMEM; 43562306a36Sopenharmony_ci goto done; 43662306a36Sopenharmony_ci } 43762306a36Sopenharmony_ci /* Copy the previous sdma header to new sdma header */ 43862306a36Sopenharmony_ci pbc16 = (__le16 *)pkt->addr[pkt->index].kvaddr; 43962306a36Sopenharmony_ci memcpy(pbcvaddr, pbc16, pbclen); 44062306a36Sopenharmony_ci 44162306a36Sopenharmony_ci /* Modify the previous sdma header */ 44262306a36Sopenharmony_ci hdr = (struct qib_message_header *)&pbc16[4]; 44362306a36Sopenharmony_ci 44462306a36Sopenharmony_ci /* New pbc length */ 44562306a36Sopenharmony_ci pbc16[0] = cpu_to_le16(le16_to_cpu(pbc16[0])-(pkt->bytes_togo>>2)); 44662306a36Sopenharmony_ci 44762306a36Sopenharmony_ci /* New packet length */ 44862306a36Sopenharmony_ci hdr->lrh[2] = cpu_to_be16(le16_to_cpu(pbc16[0])); 44962306a36Sopenharmony_ci 45062306a36Sopenharmony_ci if (pkt->tiddma) { 45162306a36Sopenharmony_ci /* turn on the header suppression */ 45262306a36Sopenharmony_ci hdr->iph.pkt_flags = 45362306a36Sopenharmony_ci cpu_to_le16(le16_to_cpu(hdr->iph.pkt_flags)|0x2); 45462306a36Sopenharmony_ci /* turn off ACK_REQ: 0x04 and EXPECTED_DONE: 0x20 */ 45562306a36Sopenharmony_ci hdr->flags &= ~(0x04|0x20); 45662306a36Sopenharmony_ci } else { 45762306a36Sopenharmony_ci /* turn off extra bytes: 20-21 bits */ 45862306a36Sopenharmony_ci hdr->bth[0] = cpu_to_be32(be32_to_cpu(hdr->bth[0])&0xFFCFFFFF); 45962306a36Sopenharmony_ci /* turn off ACK_REQ: 0x04 */ 46062306a36Sopenharmony_ci hdr->flags &= ~(0x04); 46162306a36Sopenharmony_ci } 46262306a36Sopenharmony_ci 46362306a36Sopenharmony_ci /* New kdeth checksum */ 46462306a36Sopenharmony_ci vcto = le32_to_cpu(hdr->iph.ver_ctxt_tid_offset); 46562306a36Sopenharmony_ci hdr->iph.chksum = cpu_to_le16(QIB_LRH_BTH + 46662306a36Sopenharmony_ci be16_to_cpu(hdr->lrh[2]) - 46762306a36Sopenharmony_ci ((vcto>>16)&0xFFFF) - (vcto&0xFFFF) - 46862306a36Sopenharmony_ci le16_to_cpu(hdr->iph.pkt_flags)); 46962306a36Sopenharmony_ci 47062306a36Sopenharmony_ci /* The packet is done, header is not dma mapped yet. 47162306a36Sopenharmony_ci * it should be from kmalloc */ 47262306a36Sopenharmony_ci if (!pkt->addr[pkt->index].addr) { 47362306a36Sopenharmony_ci pkt->addr[pkt->index].addr = 47462306a36Sopenharmony_ci dma_map_single(&dd->pcidev->dev, 47562306a36Sopenharmony_ci pkt->addr[pkt->index].kvaddr, 47662306a36Sopenharmony_ci pkt->addr[pkt->index].dma_length, 47762306a36Sopenharmony_ci DMA_TO_DEVICE); 47862306a36Sopenharmony_ci if (dma_mapping_error(&dd->pcidev->dev, 47962306a36Sopenharmony_ci pkt->addr[pkt->index].addr)) { 48062306a36Sopenharmony_ci ret = -ENOMEM; 48162306a36Sopenharmony_ci goto done; 48262306a36Sopenharmony_ci } 48362306a36Sopenharmony_ci pkt->addr[pkt->index].dma_mapped = 1; 48462306a36Sopenharmony_ci } 48562306a36Sopenharmony_ci 48662306a36Sopenharmony_ci /* Modify the new sdma header */ 48762306a36Sopenharmony_ci pbc16 = (__le16 *)pbcvaddr; 48862306a36Sopenharmony_ci hdr = (struct qib_message_header *)&pbc16[4]; 48962306a36Sopenharmony_ci 49062306a36Sopenharmony_ci /* New pbc length */ 49162306a36Sopenharmony_ci pbc16[0] = cpu_to_le16(le16_to_cpu(pbc16[0])-(pkt->payload_size>>2)); 49262306a36Sopenharmony_ci 49362306a36Sopenharmony_ci /* New packet length */ 49462306a36Sopenharmony_ci hdr->lrh[2] = cpu_to_be16(le16_to_cpu(pbc16[0])); 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_ci if (pkt->tiddma) { 49762306a36Sopenharmony_ci /* Set new tid and offset for new sdma header */ 49862306a36Sopenharmony_ci hdr->iph.ver_ctxt_tid_offset = cpu_to_le32( 49962306a36Sopenharmony_ci (le32_to_cpu(hdr->iph.ver_ctxt_tid_offset)&0xFF000000) + 50062306a36Sopenharmony_ci (pkt->tidsm[pkt->tidsmidx].tid<<QLOGIC_IB_I_TID_SHIFT) + 50162306a36Sopenharmony_ci (pkt->tidsm[pkt->tidsmidx].offset>>2)); 50262306a36Sopenharmony_ci } else { 50362306a36Sopenharmony_ci /* Middle protocol new packet offset */ 50462306a36Sopenharmony_ci hdr->uwords[2] += pkt->payload_size; 50562306a36Sopenharmony_ci } 50662306a36Sopenharmony_ci 50762306a36Sopenharmony_ci /* New kdeth checksum */ 50862306a36Sopenharmony_ci vcto = le32_to_cpu(hdr->iph.ver_ctxt_tid_offset); 50962306a36Sopenharmony_ci hdr->iph.chksum = cpu_to_le16(QIB_LRH_BTH + 51062306a36Sopenharmony_ci be16_to_cpu(hdr->lrh[2]) - 51162306a36Sopenharmony_ci ((vcto>>16)&0xFFFF) - (vcto&0xFFFF) - 51262306a36Sopenharmony_ci le16_to_cpu(hdr->iph.pkt_flags)); 51362306a36Sopenharmony_ci 51462306a36Sopenharmony_ci /* Next sequence number in new sdma header */ 51562306a36Sopenharmony_ci seqnum.val = be32_to_cpu(hdr->bth[2]); 51662306a36Sopenharmony_ci if (pkt->tiddma) 51762306a36Sopenharmony_ci seqnum.seq++; 51862306a36Sopenharmony_ci else 51962306a36Sopenharmony_ci seqnum.pkt++; 52062306a36Sopenharmony_ci hdr->bth[2] = cpu_to_be32(seqnum.val); 52162306a36Sopenharmony_ci 52262306a36Sopenharmony_ci /* Init new sdma header. */ 52362306a36Sopenharmony_ci qib_user_sdma_init_frag(pkt, pkt->naddr, /* index */ 52462306a36Sopenharmony_ci 0, pbclen, /* offset, len */ 52562306a36Sopenharmony_ci 1, 0, /* first last desc */ 52662306a36Sopenharmony_ci 0, 0, /* put page, dma mapped */ 52762306a36Sopenharmony_ci NULL, pbcvaddr, /* struct page, virt addr */ 52862306a36Sopenharmony_ci pbcdaddr, pbclen); /* dma addr, dma length */ 52962306a36Sopenharmony_ci pkt->index = pkt->naddr; 53062306a36Sopenharmony_ci pkt->payload_size = 0; 53162306a36Sopenharmony_ci pkt->naddr++; 53262306a36Sopenharmony_ci if (pkt->naddr == pkt->addrlimit) { 53362306a36Sopenharmony_ci ret = -EFAULT; 53462306a36Sopenharmony_ci goto done; 53562306a36Sopenharmony_ci } 53662306a36Sopenharmony_ci 53762306a36Sopenharmony_ci /* Prepare for next fragment in this page */ 53862306a36Sopenharmony_ci if (newlen != len) { 53962306a36Sopenharmony_ci if (dma_mapped) { 54062306a36Sopenharmony_ci put = 0; 54162306a36Sopenharmony_ci dma_mapped = 0; 54262306a36Sopenharmony_ci page = NULL; 54362306a36Sopenharmony_ci kvaddr = NULL; 54462306a36Sopenharmony_ci } 54562306a36Sopenharmony_ci len -= newlen; 54662306a36Sopenharmony_ci offset += newlen; 54762306a36Sopenharmony_ci 54862306a36Sopenharmony_ci goto next_fragment; 54962306a36Sopenharmony_ci } 55062306a36Sopenharmony_ci 55162306a36Sopenharmony_cidone: 55262306a36Sopenharmony_ci return ret; 55362306a36Sopenharmony_ci} 55462306a36Sopenharmony_ci 55562306a36Sopenharmony_ci/* we've too many pages in the iovec, coalesce to a single page */ 55662306a36Sopenharmony_cistatic int qib_user_sdma_coalesce(const struct qib_devdata *dd, 55762306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 55862306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 55962306a36Sopenharmony_ci const struct iovec *iov, 56062306a36Sopenharmony_ci unsigned long niov) 56162306a36Sopenharmony_ci{ 56262306a36Sopenharmony_ci int ret = 0; 56362306a36Sopenharmony_ci struct page *page = alloc_page(GFP_KERNEL); 56462306a36Sopenharmony_ci void *mpage_save; 56562306a36Sopenharmony_ci char *mpage; 56662306a36Sopenharmony_ci int i; 56762306a36Sopenharmony_ci int len = 0; 56862306a36Sopenharmony_ci 56962306a36Sopenharmony_ci if (!page) { 57062306a36Sopenharmony_ci ret = -ENOMEM; 57162306a36Sopenharmony_ci goto done; 57262306a36Sopenharmony_ci } 57362306a36Sopenharmony_ci 57462306a36Sopenharmony_ci mpage = page_address(page); 57562306a36Sopenharmony_ci mpage_save = mpage; 57662306a36Sopenharmony_ci for (i = 0; i < niov; i++) { 57762306a36Sopenharmony_ci int cfur; 57862306a36Sopenharmony_ci 57962306a36Sopenharmony_ci cfur = copy_from_user(mpage, 58062306a36Sopenharmony_ci iov[i].iov_base, iov[i].iov_len); 58162306a36Sopenharmony_ci if (cfur) { 58262306a36Sopenharmony_ci ret = -EFAULT; 58362306a36Sopenharmony_ci goto page_free; 58462306a36Sopenharmony_ci } 58562306a36Sopenharmony_ci 58662306a36Sopenharmony_ci mpage += iov[i].iov_len; 58762306a36Sopenharmony_ci len += iov[i].iov_len; 58862306a36Sopenharmony_ci } 58962306a36Sopenharmony_ci 59062306a36Sopenharmony_ci ret = qib_user_sdma_page_to_frags(dd, pq, pkt, 59162306a36Sopenharmony_ci page, 0, 0, len, mpage_save); 59262306a36Sopenharmony_ci goto done; 59362306a36Sopenharmony_ci 59462306a36Sopenharmony_cipage_free: 59562306a36Sopenharmony_ci __free_page(page); 59662306a36Sopenharmony_cidone: 59762306a36Sopenharmony_ci return ret; 59862306a36Sopenharmony_ci} 59962306a36Sopenharmony_ci 60062306a36Sopenharmony_ci/* 60162306a36Sopenharmony_ci * How many pages in this iovec element? 60262306a36Sopenharmony_ci */ 60362306a36Sopenharmony_cistatic size_t qib_user_sdma_num_pages(const struct iovec *iov) 60462306a36Sopenharmony_ci{ 60562306a36Sopenharmony_ci const unsigned long addr = (unsigned long) iov->iov_base; 60662306a36Sopenharmony_ci const unsigned long len = iov->iov_len; 60762306a36Sopenharmony_ci const unsigned long spage = addr & PAGE_MASK; 60862306a36Sopenharmony_ci const unsigned long epage = (addr + len - 1) & PAGE_MASK; 60962306a36Sopenharmony_ci 61062306a36Sopenharmony_ci return 1 + ((epage - spage) >> PAGE_SHIFT); 61162306a36Sopenharmony_ci} 61262306a36Sopenharmony_ci 61362306a36Sopenharmony_cistatic void qib_user_sdma_free_pkt_frag(struct device *dev, 61462306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 61562306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 61662306a36Sopenharmony_ci int frag) 61762306a36Sopenharmony_ci{ 61862306a36Sopenharmony_ci const int i = frag; 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_ci if (pkt->addr[i].page) { 62162306a36Sopenharmony_ci /* only user data has page */ 62262306a36Sopenharmony_ci if (pkt->addr[i].dma_mapped) 62362306a36Sopenharmony_ci dma_unmap_page(dev, 62462306a36Sopenharmony_ci pkt->addr[i].addr, 62562306a36Sopenharmony_ci pkt->addr[i].dma_length, 62662306a36Sopenharmony_ci DMA_TO_DEVICE); 62762306a36Sopenharmony_ci 62862306a36Sopenharmony_ci if (pkt->addr[i].put_page) 62962306a36Sopenharmony_ci unpin_user_page(pkt->addr[i].page); 63062306a36Sopenharmony_ci else 63162306a36Sopenharmony_ci __free_page(pkt->addr[i].page); 63262306a36Sopenharmony_ci } else if (pkt->addr[i].kvaddr) { 63362306a36Sopenharmony_ci /* for headers */ 63462306a36Sopenharmony_ci if (pkt->addr[i].dma_mapped) { 63562306a36Sopenharmony_ci /* from kmalloc & dma mapped */ 63662306a36Sopenharmony_ci dma_unmap_single(dev, 63762306a36Sopenharmony_ci pkt->addr[i].addr, 63862306a36Sopenharmony_ci pkt->addr[i].dma_length, 63962306a36Sopenharmony_ci DMA_TO_DEVICE); 64062306a36Sopenharmony_ci kfree(pkt->addr[i].kvaddr); 64162306a36Sopenharmony_ci } else if (pkt->addr[i].addr) { 64262306a36Sopenharmony_ci /* free coherent mem from cache... */ 64362306a36Sopenharmony_ci dma_pool_free(pq->header_cache, 64462306a36Sopenharmony_ci pkt->addr[i].kvaddr, pkt->addr[i].addr); 64562306a36Sopenharmony_ci } else { 64662306a36Sopenharmony_ci /* from kmalloc but not dma mapped */ 64762306a36Sopenharmony_ci kfree(pkt->addr[i].kvaddr); 64862306a36Sopenharmony_ci } 64962306a36Sopenharmony_ci } 65062306a36Sopenharmony_ci} 65162306a36Sopenharmony_ci 65262306a36Sopenharmony_ci/* return number of pages pinned... */ 65362306a36Sopenharmony_cistatic int qib_user_sdma_pin_pages(const struct qib_devdata *dd, 65462306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 65562306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 65662306a36Sopenharmony_ci unsigned long addr, int tlen, size_t npages) 65762306a36Sopenharmony_ci{ 65862306a36Sopenharmony_ci struct page *pages[8]; 65962306a36Sopenharmony_ci int i, j; 66062306a36Sopenharmony_ci int ret = 0; 66162306a36Sopenharmony_ci 66262306a36Sopenharmony_ci while (npages) { 66362306a36Sopenharmony_ci if (npages > 8) 66462306a36Sopenharmony_ci j = 8; 66562306a36Sopenharmony_ci else 66662306a36Sopenharmony_ci j = npages; 66762306a36Sopenharmony_ci 66862306a36Sopenharmony_ci ret = pin_user_pages_fast(addr, j, FOLL_LONGTERM, pages); 66962306a36Sopenharmony_ci if (ret != j) { 67062306a36Sopenharmony_ci i = 0; 67162306a36Sopenharmony_ci j = ret; 67262306a36Sopenharmony_ci ret = -ENOMEM; 67362306a36Sopenharmony_ci goto free_pages; 67462306a36Sopenharmony_ci } 67562306a36Sopenharmony_ci 67662306a36Sopenharmony_ci for (i = 0; i < j; i++) { 67762306a36Sopenharmony_ci /* map the pages... */ 67862306a36Sopenharmony_ci unsigned long fofs = addr & ~PAGE_MASK; 67962306a36Sopenharmony_ci int flen = ((fofs + tlen) > PAGE_SIZE) ? 68062306a36Sopenharmony_ci (PAGE_SIZE - fofs) : tlen; 68162306a36Sopenharmony_ci 68262306a36Sopenharmony_ci ret = qib_user_sdma_page_to_frags(dd, pq, pkt, 68362306a36Sopenharmony_ci pages[i], 1, fofs, flen, NULL); 68462306a36Sopenharmony_ci if (ret < 0) { 68562306a36Sopenharmony_ci /* current page has beed taken 68662306a36Sopenharmony_ci * care of inside above call. 68762306a36Sopenharmony_ci */ 68862306a36Sopenharmony_ci i++; 68962306a36Sopenharmony_ci goto free_pages; 69062306a36Sopenharmony_ci } 69162306a36Sopenharmony_ci 69262306a36Sopenharmony_ci addr += flen; 69362306a36Sopenharmony_ci tlen -= flen; 69462306a36Sopenharmony_ci } 69562306a36Sopenharmony_ci 69662306a36Sopenharmony_ci npages -= j; 69762306a36Sopenharmony_ci } 69862306a36Sopenharmony_ci 69962306a36Sopenharmony_ci goto done; 70062306a36Sopenharmony_ci 70162306a36Sopenharmony_ci /* if error, return all pages not managed by pkt */ 70262306a36Sopenharmony_cifree_pages: 70362306a36Sopenharmony_ci while (i < j) 70462306a36Sopenharmony_ci unpin_user_page(pages[i++]); 70562306a36Sopenharmony_ci 70662306a36Sopenharmony_cidone: 70762306a36Sopenharmony_ci return ret; 70862306a36Sopenharmony_ci} 70962306a36Sopenharmony_ci 71062306a36Sopenharmony_cistatic int qib_user_sdma_pin_pkt(const struct qib_devdata *dd, 71162306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 71262306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 71362306a36Sopenharmony_ci const struct iovec *iov, 71462306a36Sopenharmony_ci unsigned long niov) 71562306a36Sopenharmony_ci{ 71662306a36Sopenharmony_ci int ret = 0; 71762306a36Sopenharmony_ci unsigned long idx; 71862306a36Sopenharmony_ci 71962306a36Sopenharmony_ci for (idx = 0; idx < niov; idx++) { 72062306a36Sopenharmony_ci const size_t npages = qib_user_sdma_num_pages(iov + idx); 72162306a36Sopenharmony_ci const unsigned long addr = (unsigned long) iov[idx].iov_base; 72262306a36Sopenharmony_ci 72362306a36Sopenharmony_ci ret = qib_user_sdma_pin_pages(dd, pq, pkt, addr, 72462306a36Sopenharmony_ci iov[idx].iov_len, npages); 72562306a36Sopenharmony_ci if (ret < 0) 72662306a36Sopenharmony_ci goto free_pkt; 72762306a36Sopenharmony_ci } 72862306a36Sopenharmony_ci 72962306a36Sopenharmony_ci goto done; 73062306a36Sopenharmony_ci 73162306a36Sopenharmony_cifree_pkt: 73262306a36Sopenharmony_ci /* we need to ignore the first entry here */ 73362306a36Sopenharmony_ci for (idx = 1; idx < pkt->naddr; idx++) 73462306a36Sopenharmony_ci qib_user_sdma_free_pkt_frag(&dd->pcidev->dev, pq, pkt, idx); 73562306a36Sopenharmony_ci 73662306a36Sopenharmony_ci /* need to dma unmap the first entry, this is to restore to 73762306a36Sopenharmony_ci * the original state so that caller can free the memory in 73862306a36Sopenharmony_ci * error condition. Caller does not know if dma mapped or not*/ 73962306a36Sopenharmony_ci if (pkt->addr[0].dma_mapped) { 74062306a36Sopenharmony_ci dma_unmap_single(&dd->pcidev->dev, 74162306a36Sopenharmony_ci pkt->addr[0].addr, 74262306a36Sopenharmony_ci pkt->addr[0].dma_length, 74362306a36Sopenharmony_ci DMA_TO_DEVICE); 74462306a36Sopenharmony_ci pkt->addr[0].addr = 0; 74562306a36Sopenharmony_ci pkt->addr[0].dma_mapped = 0; 74662306a36Sopenharmony_ci } 74762306a36Sopenharmony_ci 74862306a36Sopenharmony_cidone: 74962306a36Sopenharmony_ci return ret; 75062306a36Sopenharmony_ci} 75162306a36Sopenharmony_ci 75262306a36Sopenharmony_cistatic int qib_user_sdma_init_payload(const struct qib_devdata *dd, 75362306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 75462306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, 75562306a36Sopenharmony_ci const struct iovec *iov, 75662306a36Sopenharmony_ci unsigned long niov, int npages) 75762306a36Sopenharmony_ci{ 75862306a36Sopenharmony_ci int ret = 0; 75962306a36Sopenharmony_ci 76062306a36Sopenharmony_ci if (pkt->frag_size == pkt->bytes_togo && 76162306a36Sopenharmony_ci npages >= ARRAY_SIZE(pkt->addr)) 76262306a36Sopenharmony_ci ret = qib_user_sdma_coalesce(dd, pq, pkt, iov, niov); 76362306a36Sopenharmony_ci else 76462306a36Sopenharmony_ci ret = qib_user_sdma_pin_pkt(dd, pq, pkt, iov, niov); 76562306a36Sopenharmony_ci 76662306a36Sopenharmony_ci return ret; 76762306a36Sopenharmony_ci} 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_ci/* free a packet list -- return counter value of last packet */ 77062306a36Sopenharmony_cistatic void qib_user_sdma_free_pkt_list(struct device *dev, 77162306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 77262306a36Sopenharmony_ci struct list_head *list) 77362306a36Sopenharmony_ci{ 77462306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, *pkt_next; 77562306a36Sopenharmony_ci 77662306a36Sopenharmony_ci list_for_each_entry_safe(pkt, pkt_next, list, list) { 77762306a36Sopenharmony_ci int i; 77862306a36Sopenharmony_ci 77962306a36Sopenharmony_ci for (i = 0; i < pkt->naddr; i++) 78062306a36Sopenharmony_ci qib_user_sdma_free_pkt_frag(dev, pq, pkt, i); 78162306a36Sopenharmony_ci 78262306a36Sopenharmony_ci if (pkt->largepkt) 78362306a36Sopenharmony_ci kfree(pkt); 78462306a36Sopenharmony_ci else 78562306a36Sopenharmony_ci kmem_cache_free(pq->pkt_slab, pkt); 78662306a36Sopenharmony_ci } 78762306a36Sopenharmony_ci INIT_LIST_HEAD(list); 78862306a36Sopenharmony_ci} 78962306a36Sopenharmony_ci 79062306a36Sopenharmony_ci/* 79162306a36Sopenharmony_ci * copy headers, coalesce etc -- pq->lock must be held 79262306a36Sopenharmony_ci * 79362306a36Sopenharmony_ci * we queue all the packets to list, returning the 79462306a36Sopenharmony_ci * number of bytes total. list must be empty initially, 79562306a36Sopenharmony_ci * as, if there is an error we clean it... 79662306a36Sopenharmony_ci */ 79762306a36Sopenharmony_cistatic int qib_user_sdma_queue_pkts(const struct qib_devdata *dd, 79862306a36Sopenharmony_ci struct qib_pportdata *ppd, 79962306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 80062306a36Sopenharmony_ci const struct iovec *iov, 80162306a36Sopenharmony_ci unsigned long niov, 80262306a36Sopenharmony_ci struct list_head *list, 80362306a36Sopenharmony_ci int *maxpkts, int *ndesc) 80462306a36Sopenharmony_ci{ 80562306a36Sopenharmony_ci unsigned long idx = 0; 80662306a36Sopenharmony_ci int ret = 0; 80762306a36Sopenharmony_ci int npkts = 0; 80862306a36Sopenharmony_ci __le32 *pbc; 80962306a36Sopenharmony_ci dma_addr_t dma_addr; 81062306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt = NULL; 81162306a36Sopenharmony_ci size_t len; 81262306a36Sopenharmony_ci size_t nw; 81362306a36Sopenharmony_ci u32 counter = pq->counter; 81462306a36Sopenharmony_ci u16 frag_size; 81562306a36Sopenharmony_ci 81662306a36Sopenharmony_ci while (idx < niov && npkts < *maxpkts) { 81762306a36Sopenharmony_ci const unsigned long addr = (unsigned long) iov[idx].iov_base; 81862306a36Sopenharmony_ci const unsigned long idx_save = idx; 81962306a36Sopenharmony_ci unsigned pktnw; 82062306a36Sopenharmony_ci unsigned pktnwc; 82162306a36Sopenharmony_ci int nfrags = 0; 82262306a36Sopenharmony_ci size_t npages = 0; 82362306a36Sopenharmony_ci size_t bytes_togo = 0; 82462306a36Sopenharmony_ci int tiddma = 0; 82562306a36Sopenharmony_ci int cfur; 82662306a36Sopenharmony_ci 82762306a36Sopenharmony_ci len = iov[idx].iov_len; 82862306a36Sopenharmony_ci nw = len >> 2; 82962306a36Sopenharmony_ci 83062306a36Sopenharmony_ci if (len < QIB_USER_SDMA_MIN_HEADER_LENGTH || 83162306a36Sopenharmony_ci len > PAGE_SIZE || len & 3 || addr & 3) { 83262306a36Sopenharmony_ci ret = -EINVAL; 83362306a36Sopenharmony_ci goto free_list; 83462306a36Sopenharmony_ci } 83562306a36Sopenharmony_ci 83662306a36Sopenharmony_ci pbc = qib_user_sdma_alloc_header(pq, len, &dma_addr); 83762306a36Sopenharmony_ci if (!pbc) { 83862306a36Sopenharmony_ci ret = -ENOMEM; 83962306a36Sopenharmony_ci goto free_list; 84062306a36Sopenharmony_ci } 84162306a36Sopenharmony_ci 84262306a36Sopenharmony_ci cfur = copy_from_user(pbc, iov[idx].iov_base, len); 84362306a36Sopenharmony_ci if (cfur) { 84462306a36Sopenharmony_ci ret = -EFAULT; 84562306a36Sopenharmony_ci goto free_pbc; 84662306a36Sopenharmony_ci } 84762306a36Sopenharmony_ci 84862306a36Sopenharmony_ci /* 84962306a36Sopenharmony_ci * This assignment is a bit strange. it's because 85062306a36Sopenharmony_ci * the pbc counts the number of 32 bit words in the full 85162306a36Sopenharmony_ci * packet _except_ the first word of the pbc itself... 85262306a36Sopenharmony_ci */ 85362306a36Sopenharmony_ci pktnwc = nw - 1; 85462306a36Sopenharmony_ci 85562306a36Sopenharmony_ci /* 85662306a36Sopenharmony_ci * pktnw computation yields the number of 32 bit words 85762306a36Sopenharmony_ci * that the caller has indicated in the PBC. note that 85862306a36Sopenharmony_ci * this is one less than the total number of words that 85962306a36Sopenharmony_ci * goes to the send DMA engine as the first 32 bit word 86062306a36Sopenharmony_ci * of the PBC itself is not counted. Armed with this count, 86162306a36Sopenharmony_ci * we can verify that the packet is consistent with the 86262306a36Sopenharmony_ci * iovec lengths. 86362306a36Sopenharmony_ci */ 86462306a36Sopenharmony_ci pktnw = le32_to_cpu(*pbc) & 0xFFFF; 86562306a36Sopenharmony_ci if (pktnw < pktnwc) { 86662306a36Sopenharmony_ci ret = -EINVAL; 86762306a36Sopenharmony_ci goto free_pbc; 86862306a36Sopenharmony_ci } 86962306a36Sopenharmony_ci 87062306a36Sopenharmony_ci idx++; 87162306a36Sopenharmony_ci while (pktnwc < pktnw && idx < niov) { 87262306a36Sopenharmony_ci const size_t slen = iov[idx].iov_len; 87362306a36Sopenharmony_ci const unsigned long faddr = 87462306a36Sopenharmony_ci (unsigned long) iov[idx].iov_base; 87562306a36Sopenharmony_ci 87662306a36Sopenharmony_ci if (slen & 3 || faddr & 3 || !slen) { 87762306a36Sopenharmony_ci ret = -EINVAL; 87862306a36Sopenharmony_ci goto free_pbc; 87962306a36Sopenharmony_ci } 88062306a36Sopenharmony_ci 88162306a36Sopenharmony_ci npages += qib_user_sdma_num_pages(&iov[idx]); 88262306a36Sopenharmony_ci 88362306a36Sopenharmony_ci if (check_add_overflow(bytes_togo, slen, &bytes_togo) || 88462306a36Sopenharmony_ci bytes_togo > type_max(typeof(pkt->bytes_togo))) { 88562306a36Sopenharmony_ci ret = -EINVAL; 88662306a36Sopenharmony_ci goto free_pbc; 88762306a36Sopenharmony_ci } 88862306a36Sopenharmony_ci pktnwc += slen >> 2; 88962306a36Sopenharmony_ci idx++; 89062306a36Sopenharmony_ci nfrags++; 89162306a36Sopenharmony_ci } 89262306a36Sopenharmony_ci 89362306a36Sopenharmony_ci if (pktnwc != pktnw) { 89462306a36Sopenharmony_ci ret = -EINVAL; 89562306a36Sopenharmony_ci goto free_pbc; 89662306a36Sopenharmony_ci } 89762306a36Sopenharmony_ci 89862306a36Sopenharmony_ci frag_size = ((le32_to_cpu(*pbc))>>16) & 0xFFFF; 89962306a36Sopenharmony_ci if (((frag_size ? frag_size : bytes_togo) + len) > 90062306a36Sopenharmony_ci ppd->ibmaxlen) { 90162306a36Sopenharmony_ci ret = -EINVAL; 90262306a36Sopenharmony_ci goto free_pbc; 90362306a36Sopenharmony_ci } 90462306a36Sopenharmony_ci 90562306a36Sopenharmony_ci if (frag_size) { 90662306a36Sopenharmony_ci size_t tidsmsize, n, pktsize, sz, addrlimit; 90762306a36Sopenharmony_ci 90862306a36Sopenharmony_ci n = npages*((2*PAGE_SIZE/frag_size)+1); 90962306a36Sopenharmony_ci pktsize = struct_size(pkt, addr, n); 91062306a36Sopenharmony_ci 91162306a36Sopenharmony_ci /* 91262306a36Sopenharmony_ci * Determine if this is tid-sdma or just sdma. 91362306a36Sopenharmony_ci */ 91462306a36Sopenharmony_ci tiddma = (((le32_to_cpu(pbc[7])>> 91562306a36Sopenharmony_ci QLOGIC_IB_I_TID_SHIFT)& 91662306a36Sopenharmony_ci QLOGIC_IB_I_TID_MASK) != 91762306a36Sopenharmony_ci QLOGIC_IB_I_TID_MASK); 91862306a36Sopenharmony_ci 91962306a36Sopenharmony_ci if (tiddma) 92062306a36Sopenharmony_ci tidsmsize = iov[idx].iov_len; 92162306a36Sopenharmony_ci else 92262306a36Sopenharmony_ci tidsmsize = 0; 92362306a36Sopenharmony_ci 92462306a36Sopenharmony_ci if (check_add_overflow(pktsize, tidsmsize, &sz)) { 92562306a36Sopenharmony_ci ret = -EINVAL; 92662306a36Sopenharmony_ci goto free_pbc; 92762306a36Sopenharmony_ci } 92862306a36Sopenharmony_ci pkt = kmalloc(sz, GFP_KERNEL); 92962306a36Sopenharmony_ci if (!pkt) { 93062306a36Sopenharmony_ci ret = -ENOMEM; 93162306a36Sopenharmony_ci goto free_pbc; 93262306a36Sopenharmony_ci } 93362306a36Sopenharmony_ci pkt->largepkt = 1; 93462306a36Sopenharmony_ci pkt->frag_size = frag_size; 93562306a36Sopenharmony_ci if (check_add_overflow(n, ARRAY_SIZE(pkt->addr), 93662306a36Sopenharmony_ci &addrlimit) || 93762306a36Sopenharmony_ci addrlimit > type_max(typeof(pkt->addrlimit))) { 93862306a36Sopenharmony_ci ret = -EINVAL; 93962306a36Sopenharmony_ci goto free_pkt; 94062306a36Sopenharmony_ci } 94162306a36Sopenharmony_ci pkt->addrlimit = addrlimit; 94262306a36Sopenharmony_ci 94362306a36Sopenharmony_ci if (tiddma) { 94462306a36Sopenharmony_ci char *tidsm = (char *)pkt + pktsize; 94562306a36Sopenharmony_ci 94662306a36Sopenharmony_ci cfur = copy_from_user(tidsm, 94762306a36Sopenharmony_ci iov[idx].iov_base, tidsmsize); 94862306a36Sopenharmony_ci if (cfur) { 94962306a36Sopenharmony_ci ret = -EFAULT; 95062306a36Sopenharmony_ci goto free_pkt; 95162306a36Sopenharmony_ci } 95262306a36Sopenharmony_ci pkt->tidsm = 95362306a36Sopenharmony_ci (struct qib_tid_session_member *)tidsm; 95462306a36Sopenharmony_ci pkt->tidsmcount = tidsmsize/ 95562306a36Sopenharmony_ci sizeof(struct qib_tid_session_member); 95662306a36Sopenharmony_ci pkt->tidsmidx = 0; 95762306a36Sopenharmony_ci idx++; 95862306a36Sopenharmony_ci } 95962306a36Sopenharmony_ci 96062306a36Sopenharmony_ci /* 96162306a36Sopenharmony_ci * pbc 'fill1' field is borrowed to pass frag size, 96262306a36Sopenharmony_ci * we need to clear it after picking frag size, the 96362306a36Sopenharmony_ci * hardware requires this field to be zero. 96462306a36Sopenharmony_ci */ 96562306a36Sopenharmony_ci *pbc = cpu_to_le32(le32_to_cpu(*pbc) & 0x0000FFFF); 96662306a36Sopenharmony_ci } else { 96762306a36Sopenharmony_ci pkt = kmem_cache_alloc(pq->pkt_slab, GFP_KERNEL); 96862306a36Sopenharmony_ci if (!pkt) { 96962306a36Sopenharmony_ci ret = -ENOMEM; 97062306a36Sopenharmony_ci goto free_pbc; 97162306a36Sopenharmony_ci } 97262306a36Sopenharmony_ci pkt->largepkt = 0; 97362306a36Sopenharmony_ci pkt->frag_size = bytes_togo; 97462306a36Sopenharmony_ci pkt->addrlimit = ARRAY_SIZE(pkt->addr); 97562306a36Sopenharmony_ci } 97662306a36Sopenharmony_ci pkt->bytes_togo = bytes_togo; 97762306a36Sopenharmony_ci pkt->payload_size = 0; 97862306a36Sopenharmony_ci pkt->counter = counter; 97962306a36Sopenharmony_ci pkt->tiddma = tiddma; 98062306a36Sopenharmony_ci 98162306a36Sopenharmony_ci /* setup the first header */ 98262306a36Sopenharmony_ci qib_user_sdma_init_frag(pkt, 0, /* index */ 98362306a36Sopenharmony_ci 0, len, /* offset, len */ 98462306a36Sopenharmony_ci 1, 0, /* first last desc */ 98562306a36Sopenharmony_ci 0, 0, /* put page, dma mapped */ 98662306a36Sopenharmony_ci NULL, pbc, /* struct page, virt addr */ 98762306a36Sopenharmony_ci dma_addr, len); /* dma addr, dma length */ 98862306a36Sopenharmony_ci pkt->index = 0; 98962306a36Sopenharmony_ci pkt->naddr = 1; 99062306a36Sopenharmony_ci 99162306a36Sopenharmony_ci if (nfrags) { 99262306a36Sopenharmony_ci ret = qib_user_sdma_init_payload(dd, pq, pkt, 99362306a36Sopenharmony_ci iov + idx_save + 1, 99462306a36Sopenharmony_ci nfrags, npages); 99562306a36Sopenharmony_ci if (ret < 0) 99662306a36Sopenharmony_ci goto free_pkt; 99762306a36Sopenharmony_ci } else { 99862306a36Sopenharmony_ci /* since there is no payload, mark the 99962306a36Sopenharmony_ci * header as the last desc. */ 100062306a36Sopenharmony_ci pkt->addr[0].last_desc = 1; 100162306a36Sopenharmony_ci 100262306a36Sopenharmony_ci if (dma_addr == 0) { 100362306a36Sopenharmony_ci /* 100462306a36Sopenharmony_ci * the header is not dma mapped yet. 100562306a36Sopenharmony_ci * it should be from kmalloc. 100662306a36Sopenharmony_ci */ 100762306a36Sopenharmony_ci dma_addr = dma_map_single(&dd->pcidev->dev, 100862306a36Sopenharmony_ci pbc, len, DMA_TO_DEVICE); 100962306a36Sopenharmony_ci if (dma_mapping_error(&dd->pcidev->dev, 101062306a36Sopenharmony_ci dma_addr)) { 101162306a36Sopenharmony_ci ret = -ENOMEM; 101262306a36Sopenharmony_ci goto free_pkt; 101362306a36Sopenharmony_ci } 101462306a36Sopenharmony_ci pkt->addr[0].addr = dma_addr; 101562306a36Sopenharmony_ci pkt->addr[0].dma_mapped = 1; 101662306a36Sopenharmony_ci } 101762306a36Sopenharmony_ci } 101862306a36Sopenharmony_ci 101962306a36Sopenharmony_ci counter++; 102062306a36Sopenharmony_ci npkts++; 102162306a36Sopenharmony_ci pkt->pq = pq; 102262306a36Sopenharmony_ci pkt->index = 0; /* reset index for push on hw */ 102362306a36Sopenharmony_ci *ndesc += pkt->naddr; 102462306a36Sopenharmony_ci 102562306a36Sopenharmony_ci list_add_tail(&pkt->list, list); 102662306a36Sopenharmony_ci } 102762306a36Sopenharmony_ci 102862306a36Sopenharmony_ci *maxpkts = npkts; 102962306a36Sopenharmony_ci ret = idx; 103062306a36Sopenharmony_ci goto done; 103162306a36Sopenharmony_ci 103262306a36Sopenharmony_cifree_pkt: 103362306a36Sopenharmony_ci if (pkt->largepkt) 103462306a36Sopenharmony_ci kfree(pkt); 103562306a36Sopenharmony_ci else 103662306a36Sopenharmony_ci kmem_cache_free(pq->pkt_slab, pkt); 103762306a36Sopenharmony_cifree_pbc: 103862306a36Sopenharmony_ci if (dma_addr) 103962306a36Sopenharmony_ci dma_pool_free(pq->header_cache, pbc, dma_addr); 104062306a36Sopenharmony_ci else 104162306a36Sopenharmony_ci kfree(pbc); 104262306a36Sopenharmony_cifree_list: 104362306a36Sopenharmony_ci qib_user_sdma_free_pkt_list(&dd->pcidev->dev, pq, list); 104462306a36Sopenharmony_cidone: 104562306a36Sopenharmony_ci return ret; 104662306a36Sopenharmony_ci} 104762306a36Sopenharmony_ci 104862306a36Sopenharmony_cistatic void qib_user_sdma_set_complete_counter(struct qib_user_sdma_queue *pq, 104962306a36Sopenharmony_ci u32 c) 105062306a36Sopenharmony_ci{ 105162306a36Sopenharmony_ci pq->sent_counter = c; 105262306a36Sopenharmony_ci} 105362306a36Sopenharmony_ci 105462306a36Sopenharmony_ci/* try to clean out queue -- needs pq->lock */ 105562306a36Sopenharmony_cistatic int qib_user_sdma_queue_clean(struct qib_pportdata *ppd, 105662306a36Sopenharmony_ci struct qib_user_sdma_queue *pq) 105762306a36Sopenharmony_ci{ 105862306a36Sopenharmony_ci struct qib_devdata *dd = ppd->dd; 105962306a36Sopenharmony_ci struct list_head free_list; 106062306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt; 106162306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt_prev; 106262306a36Sopenharmony_ci unsigned long flags; 106362306a36Sopenharmony_ci int ret = 0; 106462306a36Sopenharmony_ci 106562306a36Sopenharmony_ci if (!pq->num_sending) 106662306a36Sopenharmony_ci return 0; 106762306a36Sopenharmony_ci 106862306a36Sopenharmony_ci INIT_LIST_HEAD(&free_list); 106962306a36Sopenharmony_ci 107062306a36Sopenharmony_ci /* 107162306a36Sopenharmony_ci * We need this spin lock here because interrupt handler 107262306a36Sopenharmony_ci * might modify this list in qib_user_sdma_send_desc(), also 107362306a36Sopenharmony_ci * we can not get interrupted, otherwise it is a deadlock. 107462306a36Sopenharmony_ci */ 107562306a36Sopenharmony_ci spin_lock_irqsave(&pq->sent_lock, flags); 107662306a36Sopenharmony_ci list_for_each_entry_safe(pkt, pkt_prev, &pq->sent, list) { 107762306a36Sopenharmony_ci s64 descd = ppd->sdma_descq_removed - pkt->added; 107862306a36Sopenharmony_ci 107962306a36Sopenharmony_ci if (descd < 0) 108062306a36Sopenharmony_ci break; 108162306a36Sopenharmony_ci 108262306a36Sopenharmony_ci list_move_tail(&pkt->list, &free_list); 108362306a36Sopenharmony_ci 108462306a36Sopenharmony_ci /* one more packet cleaned */ 108562306a36Sopenharmony_ci ret++; 108662306a36Sopenharmony_ci pq->num_sending--; 108762306a36Sopenharmony_ci } 108862306a36Sopenharmony_ci spin_unlock_irqrestore(&pq->sent_lock, flags); 108962306a36Sopenharmony_ci 109062306a36Sopenharmony_ci if (!list_empty(&free_list)) { 109162306a36Sopenharmony_ci u32 counter; 109262306a36Sopenharmony_ci 109362306a36Sopenharmony_ci pkt = list_entry(free_list.prev, 109462306a36Sopenharmony_ci struct qib_user_sdma_pkt, list); 109562306a36Sopenharmony_ci counter = pkt->counter; 109662306a36Sopenharmony_ci 109762306a36Sopenharmony_ci qib_user_sdma_free_pkt_list(&dd->pcidev->dev, pq, &free_list); 109862306a36Sopenharmony_ci qib_user_sdma_set_complete_counter(pq, counter); 109962306a36Sopenharmony_ci } 110062306a36Sopenharmony_ci 110162306a36Sopenharmony_ci return ret; 110262306a36Sopenharmony_ci} 110362306a36Sopenharmony_ci 110462306a36Sopenharmony_civoid qib_user_sdma_queue_destroy(struct qib_user_sdma_queue *pq) 110562306a36Sopenharmony_ci{ 110662306a36Sopenharmony_ci if (!pq) 110762306a36Sopenharmony_ci return; 110862306a36Sopenharmony_ci 110962306a36Sopenharmony_ci pq->sdma_rb_node->refcount--; 111062306a36Sopenharmony_ci if (pq->sdma_rb_node->refcount == 0) { 111162306a36Sopenharmony_ci rb_erase(&pq->sdma_rb_node->node, &qib_user_sdma_rb_root); 111262306a36Sopenharmony_ci kfree(pq->sdma_rb_node); 111362306a36Sopenharmony_ci } 111462306a36Sopenharmony_ci dma_pool_destroy(pq->header_cache); 111562306a36Sopenharmony_ci kmem_cache_destroy(pq->pkt_slab); 111662306a36Sopenharmony_ci kfree(pq); 111762306a36Sopenharmony_ci} 111862306a36Sopenharmony_ci 111962306a36Sopenharmony_ci/* clean descriptor queue, returns > 0 if some elements cleaned */ 112062306a36Sopenharmony_cistatic int qib_user_sdma_hwqueue_clean(struct qib_pportdata *ppd) 112162306a36Sopenharmony_ci{ 112262306a36Sopenharmony_ci int ret; 112362306a36Sopenharmony_ci unsigned long flags; 112462306a36Sopenharmony_ci 112562306a36Sopenharmony_ci spin_lock_irqsave(&ppd->sdma_lock, flags); 112662306a36Sopenharmony_ci ret = qib_sdma_make_progress(ppd); 112762306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 112862306a36Sopenharmony_ci 112962306a36Sopenharmony_ci return ret; 113062306a36Sopenharmony_ci} 113162306a36Sopenharmony_ci 113262306a36Sopenharmony_ci/* we're in close, drain packets so that we can cleanup successfully... */ 113362306a36Sopenharmony_civoid qib_user_sdma_queue_drain(struct qib_pportdata *ppd, 113462306a36Sopenharmony_ci struct qib_user_sdma_queue *pq) 113562306a36Sopenharmony_ci{ 113662306a36Sopenharmony_ci struct qib_devdata *dd = ppd->dd; 113762306a36Sopenharmony_ci unsigned long flags; 113862306a36Sopenharmony_ci int i; 113962306a36Sopenharmony_ci 114062306a36Sopenharmony_ci if (!pq) 114162306a36Sopenharmony_ci return; 114262306a36Sopenharmony_ci 114362306a36Sopenharmony_ci for (i = 0; i < QIB_USER_SDMA_DRAIN_TIMEOUT; i++) { 114462306a36Sopenharmony_ci mutex_lock(&pq->lock); 114562306a36Sopenharmony_ci if (!pq->num_pending && !pq->num_sending) { 114662306a36Sopenharmony_ci mutex_unlock(&pq->lock); 114762306a36Sopenharmony_ci break; 114862306a36Sopenharmony_ci } 114962306a36Sopenharmony_ci qib_user_sdma_hwqueue_clean(ppd); 115062306a36Sopenharmony_ci qib_user_sdma_queue_clean(ppd, pq); 115162306a36Sopenharmony_ci mutex_unlock(&pq->lock); 115262306a36Sopenharmony_ci msleep(20); 115362306a36Sopenharmony_ci } 115462306a36Sopenharmony_ci 115562306a36Sopenharmony_ci if (pq->num_pending || pq->num_sending) { 115662306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt; 115762306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt_prev; 115862306a36Sopenharmony_ci struct list_head free_list; 115962306a36Sopenharmony_ci 116062306a36Sopenharmony_ci mutex_lock(&pq->lock); 116162306a36Sopenharmony_ci spin_lock_irqsave(&ppd->sdma_lock, flags); 116262306a36Sopenharmony_ci /* 116362306a36Sopenharmony_ci * Since we hold sdma_lock, it is safe without sent_lock. 116462306a36Sopenharmony_ci */ 116562306a36Sopenharmony_ci if (pq->num_pending) { 116662306a36Sopenharmony_ci list_for_each_entry_safe(pkt, pkt_prev, 116762306a36Sopenharmony_ci &ppd->sdma_userpending, list) { 116862306a36Sopenharmony_ci if (pkt->pq == pq) { 116962306a36Sopenharmony_ci list_move_tail(&pkt->list, &pq->sent); 117062306a36Sopenharmony_ci pq->num_pending--; 117162306a36Sopenharmony_ci pq->num_sending++; 117262306a36Sopenharmony_ci } 117362306a36Sopenharmony_ci } 117462306a36Sopenharmony_ci } 117562306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 117662306a36Sopenharmony_ci 117762306a36Sopenharmony_ci qib_dev_err(dd, "user sdma lists not empty: forcing!\n"); 117862306a36Sopenharmony_ci INIT_LIST_HEAD(&free_list); 117962306a36Sopenharmony_ci list_splice_init(&pq->sent, &free_list); 118062306a36Sopenharmony_ci pq->num_sending = 0; 118162306a36Sopenharmony_ci qib_user_sdma_free_pkt_list(&dd->pcidev->dev, pq, &free_list); 118262306a36Sopenharmony_ci mutex_unlock(&pq->lock); 118362306a36Sopenharmony_ci } 118462306a36Sopenharmony_ci} 118562306a36Sopenharmony_ci 118662306a36Sopenharmony_cistatic inline __le64 qib_sdma_make_desc0(u8 gen, 118762306a36Sopenharmony_ci u64 addr, u64 dwlen, u64 dwoffset) 118862306a36Sopenharmony_ci{ 118962306a36Sopenharmony_ci return cpu_to_le64(/* SDmaPhyAddr[31:0] */ 119062306a36Sopenharmony_ci ((addr & 0xfffffffcULL) << 32) | 119162306a36Sopenharmony_ci /* SDmaGeneration[1:0] */ 119262306a36Sopenharmony_ci ((gen & 3ULL) << 30) | 119362306a36Sopenharmony_ci /* SDmaDwordCount[10:0] */ 119462306a36Sopenharmony_ci ((dwlen & 0x7ffULL) << 16) | 119562306a36Sopenharmony_ci /* SDmaBufOffset[12:2] */ 119662306a36Sopenharmony_ci (dwoffset & 0x7ffULL)); 119762306a36Sopenharmony_ci} 119862306a36Sopenharmony_ci 119962306a36Sopenharmony_cistatic inline __le64 qib_sdma_make_first_desc0(__le64 descq) 120062306a36Sopenharmony_ci{ 120162306a36Sopenharmony_ci return descq | cpu_to_le64(1ULL << 12); 120262306a36Sopenharmony_ci} 120362306a36Sopenharmony_ci 120462306a36Sopenharmony_cistatic inline __le64 qib_sdma_make_last_desc0(__le64 descq) 120562306a36Sopenharmony_ci{ 120662306a36Sopenharmony_ci /* last */ /* dma head */ 120762306a36Sopenharmony_ci return descq | cpu_to_le64(1ULL << 11 | 1ULL << 13); 120862306a36Sopenharmony_ci} 120962306a36Sopenharmony_ci 121062306a36Sopenharmony_cistatic inline __le64 qib_sdma_make_desc1(u64 addr) 121162306a36Sopenharmony_ci{ 121262306a36Sopenharmony_ci /* SDmaPhyAddr[47:32] */ 121362306a36Sopenharmony_ci return cpu_to_le64(addr >> 32); 121462306a36Sopenharmony_ci} 121562306a36Sopenharmony_ci 121662306a36Sopenharmony_cistatic void qib_user_sdma_send_frag(struct qib_pportdata *ppd, 121762306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt, int idx, 121862306a36Sopenharmony_ci unsigned ofs, u16 tail, u8 gen) 121962306a36Sopenharmony_ci{ 122062306a36Sopenharmony_ci const u64 addr = (u64) pkt->addr[idx].addr + 122162306a36Sopenharmony_ci (u64) pkt->addr[idx].offset; 122262306a36Sopenharmony_ci const u64 dwlen = (u64) pkt->addr[idx].length / 4; 122362306a36Sopenharmony_ci __le64 *descqp; 122462306a36Sopenharmony_ci __le64 descq0; 122562306a36Sopenharmony_ci 122662306a36Sopenharmony_ci descqp = &ppd->sdma_descq[tail].qw[0]; 122762306a36Sopenharmony_ci 122862306a36Sopenharmony_ci descq0 = qib_sdma_make_desc0(gen, addr, dwlen, ofs); 122962306a36Sopenharmony_ci if (pkt->addr[idx].first_desc) 123062306a36Sopenharmony_ci descq0 = qib_sdma_make_first_desc0(descq0); 123162306a36Sopenharmony_ci if (pkt->addr[idx].last_desc) { 123262306a36Sopenharmony_ci descq0 = qib_sdma_make_last_desc0(descq0); 123362306a36Sopenharmony_ci if (ppd->sdma_intrequest) { 123462306a36Sopenharmony_ci descq0 |= cpu_to_le64(1ULL << 15); 123562306a36Sopenharmony_ci ppd->sdma_intrequest = 0; 123662306a36Sopenharmony_ci } 123762306a36Sopenharmony_ci } 123862306a36Sopenharmony_ci 123962306a36Sopenharmony_ci descqp[0] = descq0; 124062306a36Sopenharmony_ci descqp[1] = qib_sdma_make_desc1(addr); 124162306a36Sopenharmony_ci} 124262306a36Sopenharmony_ci 124362306a36Sopenharmony_civoid qib_user_sdma_send_desc(struct qib_pportdata *ppd, 124462306a36Sopenharmony_ci struct list_head *pktlist) 124562306a36Sopenharmony_ci{ 124662306a36Sopenharmony_ci struct qib_devdata *dd = ppd->dd; 124762306a36Sopenharmony_ci u16 nfree, nsent; 124862306a36Sopenharmony_ci u16 tail, tail_c; 124962306a36Sopenharmony_ci u8 gen, gen_c; 125062306a36Sopenharmony_ci 125162306a36Sopenharmony_ci nfree = qib_sdma_descq_freecnt(ppd); 125262306a36Sopenharmony_ci if (!nfree) 125362306a36Sopenharmony_ci return; 125462306a36Sopenharmony_ci 125562306a36Sopenharmony_ciretry: 125662306a36Sopenharmony_ci nsent = 0; 125762306a36Sopenharmony_ci tail_c = tail = ppd->sdma_descq_tail; 125862306a36Sopenharmony_ci gen_c = gen = ppd->sdma_generation; 125962306a36Sopenharmony_ci while (!list_empty(pktlist)) { 126062306a36Sopenharmony_ci struct qib_user_sdma_pkt *pkt = 126162306a36Sopenharmony_ci list_entry(pktlist->next, struct qib_user_sdma_pkt, 126262306a36Sopenharmony_ci list); 126362306a36Sopenharmony_ci int i, j, c = 0; 126462306a36Sopenharmony_ci unsigned ofs = 0; 126562306a36Sopenharmony_ci u16 dtail = tail; 126662306a36Sopenharmony_ci 126762306a36Sopenharmony_ci for (i = pkt->index; i < pkt->naddr && nfree; i++) { 126862306a36Sopenharmony_ci qib_user_sdma_send_frag(ppd, pkt, i, ofs, tail, gen); 126962306a36Sopenharmony_ci ofs += pkt->addr[i].length >> 2; 127062306a36Sopenharmony_ci 127162306a36Sopenharmony_ci if (++tail == ppd->sdma_descq_cnt) { 127262306a36Sopenharmony_ci tail = 0; 127362306a36Sopenharmony_ci ++gen; 127462306a36Sopenharmony_ci ppd->sdma_intrequest = 1; 127562306a36Sopenharmony_ci } else if (tail == (ppd->sdma_descq_cnt>>1)) { 127662306a36Sopenharmony_ci ppd->sdma_intrequest = 1; 127762306a36Sopenharmony_ci } 127862306a36Sopenharmony_ci nfree--; 127962306a36Sopenharmony_ci if (pkt->addr[i].last_desc == 0) 128062306a36Sopenharmony_ci continue; 128162306a36Sopenharmony_ci 128262306a36Sopenharmony_ci /* 128362306a36Sopenharmony_ci * If the packet is >= 2KB mtu equivalent, we 128462306a36Sopenharmony_ci * have to use the large buffers, and have to 128562306a36Sopenharmony_ci * mark each descriptor as part of a large 128662306a36Sopenharmony_ci * buffer packet. 128762306a36Sopenharmony_ci */ 128862306a36Sopenharmony_ci if (ofs > dd->piosize2kmax_dwords) { 128962306a36Sopenharmony_ci for (j = pkt->index; j <= i; j++) { 129062306a36Sopenharmony_ci ppd->sdma_descq[dtail].qw[0] |= 129162306a36Sopenharmony_ci cpu_to_le64(1ULL << 14); 129262306a36Sopenharmony_ci if (++dtail == ppd->sdma_descq_cnt) 129362306a36Sopenharmony_ci dtail = 0; 129462306a36Sopenharmony_ci } 129562306a36Sopenharmony_ci } 129662306a36Sopenharmony_ci c += i + 1 - pkt->index; 129762306a36Sopenharmony_ci pkt->index = i + 1; /* index for next first */ 129862306a36Sopenharmony_ci tail_c = dtail = tail; 129962306a36Sopenharmony_ci gen_c = gen; 130062306a36Sopenharmony_ci ofs = 0; /* reset for next packet */ 130162306a36Sopenharmony_ci } 130262306a36Sopenharmony_ci 130362306a36Sopenharmony_ci ppd->sdma_descq_added += c; 130462306a36Sopenharmony_ci nsent += c; 130562306a36Sopenharmony_ci if (pkt->index == pkt->naddr) { 130662306a36Sopenharmony_ci pkt->added = ppd->sdma_descq_added; 130762306a36Sopenharmony_ci pkt->pq->added = pkt->added; 130862306a36Sopenharmony_ci pkt->pq->num_pending--; 130962306a36Sopenharmony_ci spin_lock(&pkt->pq->sent_lock); 131062306a36Sopenharmony_ci pkt->pq->num_sending++; 131162306a36Sopenharmony_ci list_move_tail(&pkt->list, &pkt->pq->sent); 131262306a36Sopenharmony_ci spin_unlock(&pkt->pq->sent_lock); 131362306a36Sopenharmony_ci } 131462306a36Sopenharmony_ci if (!nfree || (nsent<<2) > ppd->sdma_descq_cnt) 131562306a36Sopenharmony_ci break; 131662306a36Sopenharmony_ci } 131762306a36Sopenharmony_ci 131862306a36Sopenharmony_ci /* advance the tail on the chip if necessary */ 131962306a36Sopenharmony_ci if (ppd->sdma_descq_tail != tail_c) { 132062306a36Sopenharmony_ci ppd->sdma_generation = gen_c; 132162306a36Sopenharmony_ci dd->f_sdma_update_tail(ppd, tail_c); 132262306a36Sopenharmony_ci } 132362306a36Sopenharmony_ci 132462306a36Sopenharmony_ci if (nfree && !list_empty(pktlist)) 132562306a36Sopenharmony_ci goto retry; 132662306a36Sopenharmony_ci} 132762306a36Sopenharmony_ci 132862306a36Sopenharmony_ci/* pq->lock must be held, get packets on the wire... */ 132962306a36Sopenharmony_cistatic int qib_user_sdma_push_pkts(struct qib_pportdata *ppd, 133062306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 133162306a36Sopenharmony_ci struct list_head *pktlist, int count) 133262306a36Sopenharmony_ci{ 133362306a36Sopenharmony_ci unsigned long flags; 133462306a36Sopenharmony_ci 133562306a36Sopenharmony_ci if (unlikely(!(ppd->lflags & QIBL_LINKACTIVE))) 133662306a36Sopenharmony_ci return -ECOMM; 133762306a36Sopenharmony_ci 133862306a36Sopenharmony_ci /* non-blocking mode */ 133962306a36Sopenharmony_ci if (pq->sdma_rb_node->refcount > 1) { 134062306a36Sopenharmony_ci spin_lock_irqsave(&ppd->sdma_lock, flags); 134162306a36Sopenharmony_ci if (unlikely(!__qib_sdma_running(ppd))) { 134262306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 134362306a36Sopenharmony_ci return -ECOMM; 134462306a36Sopenharmony_ci } 134562306a36Sopenharmony_ci pq->num_pending += count; 134662306a36Sopenharmony_ci list_splice_tail_init(pktlist, &ppd->sdma_userpending); 134762306a36Sopenharmony_ci qib_user_sdma_send_desc(ppd, &ppd->sdma_userpending); 134862306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 134962306a36Sopenharmony_ci return 0; 135062306a36Sopenharmony_ci } 135162306a36Sopenharmony_ci 135262306a36Sopenharmony_ci /* In this case, descriptors from this process are not 135362306a36Sopenharmony_ci * linked to ppd pending queue, interrupt handler 135462306a36Sopenharmony_ci * won't update this process, it is OK to directly 135562306a36Sopenharmony_ci * modify without sdma lock. 135662306a36Sopenharmony_ci */ 135762306a36Sopenharmony_ci 135862306a36Sopenharmony_ci 135962306a36Sopenharmony_ci pq->num_pending += count; 136062306a36Sopenharmony_ci /* 136162306a36Sopenharmony_ci * Blocking mode for single rail process, we must 136262306a36Sopenharmony_ci * release/regain sdma_lock to give other process 136362306a36Sopenharmony_ci * chance to make progress. This is important for 136462306a36Sopenharmony_ci * performance. 136562306a36Sopenharmony_ci */ 136662306a36Sopenharmony_ci do { 136762306a36Sopenharmony_ci spin_lock_irqsave(&ppd->sdma_lock, flags); 136862306a36Sopenharmony_ci if (unlikely(!__qib_sdma_running(ppd))) { 136962306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 137062306a36Sopenharmony_ci return -ECOMM; 137162306a36Sopenharmony_ci } 137262306a36Sopenharmony_ci qib_user_sdma_send_desc(ppd, pktlist); 137362306a36Sopenharmony_ci if (!list_empty(pktlist)) 137462306a36Sopenharmony_ci qib_sdma_make_progress(ppd); 137562306a36Sopenharmony_ci spin_unlock_irqrestore(&ppd->sdma_lock, flags); 137662306a36Sopenharmony_ci } while (!list_empty(pktlist)); 137762306a36Sopenharmony_ci 137862306a36Sopenharmony_ci return 0; 137962306a36Sopenharmony_ci} 138062306a36Sopenharmony_ci 138162306a36Sopenharmony_ciint qib_user_sdma_writev(struct qib_ctxtdata *rcd, 138262306a36Sopenharmony_ci struct qib_user_sdma_queue *pq, 138362306a36Sopenharmony_ci const struct iovec *iov, 138462306a36Sopenharmony_ci unsigned long dim) 138562306a36Sopenharmony_ci{ 138662306a36Sopenharmony_ci struct qib_devdata *dd = rcd->dd; 138762306a36Sopenharmony_ci struct qib_pportdata *ppd = rcd->ppd; 138862306a36Sopenharmony_ci int ret = 0; 138962306a36Sopenharmony_ci struct list_head list; 139062306a36Sopenharmony_ci int npkts = 0; 139162306a36Sopenharmony_ci 139262306a36Sopenharmony_ci INIT_LIST_HEAD(&list); 139362306a36Sopenharmony_ci 139462306a36Sopenharmony_ci mutex_lock(&pq->lock); 139562306a36Sopenharmony_ci 139662306a36Sopenharmony_ci /* why not -ECOMM like qib_user_sdma_push_pkts() below? */ 139762306a36Sopenharmony_ci if (!qib_sdma_running(ppd)) 139862306a36Sopenharmony_ci goto done_unlock; 139962306a36Sopenharmony_ci 140062306a36Sopenharmony_ci /* if I have packets not complete yet */ 140162306a36Sopenharmony_ci if (pq->added > ppd->sdma_descq_removed) 140262306a36Sopenharmony_ci qib_user_sdma_hwqueue_clean(ppd); 140362306a36Sopenharmony_ci /* if I have complete packets to be freed */ 140462306a36Sopenharmony_ci if (pq->num_sending) 140562306a36Sopenharmony_ci qib_user_sdma_queue_clean(ppd, pq); 140662306a36Sopenharmony_ci 140762306a36Sopenharmony_ci while (dim) { 140862306a36Sopenharmony_ci int mxp = 1; 140962306a36Sopenharmony_ci int ndesc = 0; 141062306a36Sopenharmony_ci 141162306a36Sopenharmony_ci ret = qib_user_sdma_queue_pkts(dd, ppd, pq, 141262306a36Sopenharmony_ci iov, dim, &list, &mxp, &ndesc); 141362306a36Sopenharmony_ci if (ret < 0) 141462306a36Sopenharmony_ci goto done_unlock; 141562306a36Sopenharmony_ci else { 141662306a36Sopenharmony_ci dim -= ret; 141762306a36Sopenharmony_ci iov += ret; 141862306a36Sopenharmony_ci } 141962306a36Sopenharmony_ci 142062306a36Sopenharmony_ci /* force packets onto the sdma hw queue... */ 142162306a36Sopenharmony_ci if (!list_empty(&list)) { 142262306a36Sopenharmony_ci /* 142362306a36Sopenharmony_ci * Lazily clean hw queue. 142462306a36Sopenharmony_ci */ 142562306a36Sopenharmony_ci if (qib_sdma_descq_freecnt(ppd) < ndesc) { 142662306a36Sopenharmony_ci qib_user_sdma_hwqueue_clean(ppd); 142762306a36Sopenharmony_ci if (pq->num_sending) 142862306a36Sopenharmony_ci qib_user_sdma_queue_clean(ppd, pq); 142962306a36Sopenharmony_ci } 143062306a36Sopenharmony_ci 143162306a36Sopenharmony_ci ret = qib_user_sdma_push_pkts(ppd, pq, &list, mxp); 143262306a36Sopenharmony_ci if (ret < 0) 143362306a36Sopenharmony_ci goto done_unlock; 143462306a36Sopenharmony_ci else { 143562306a36Sopenharmony_ci npkts += mxp; 143662306a36Sopenharmony_ci pq->counter += mxp; 143762306a36Sopenharmony_ci } 143862306a36Sopenharmony_ci } 143962306a36Sopenharmony_ci } 144062306a36Sopenharmony_ci 144162306a36Sopenharmony_cidone_unlock: 144262306a36Sopenharmony_ci if (!list_empty(&list)) 144362306a36Sopenharmony_ci qib_user_sdma_free_pkt_list(&dd->pcidev->dev, pq, &list); 144462306a36Sopenharmony_ci mutex_unlock(&pq->lock); 144562306a36Sopenharmony_ci 144662306a36Sopenharmony_ci return (ret < 0) ? ret : npkts; 144762306a36Sopenharmony_ci} 144862306a36Sopenharmony_ci 144962306a36Sopenharmony_ciint qib_user_sdma_make_progress(struct qib_pportdata *ppd, 145062306a36Sopenharmony_ci struct qib_user_sdma_queue *pq) 145162306a36Sopenharmony_ci{ 145262306a36Sopenharmony_ci int ret = 0; 145362306a36Sopenharmony_ci 145462306a36Sopenharmony_ci mutex_lock(&pq->lock); 145562306a36Sopenharmony_ci qib_user_sdma_hwqueue_clean(ppd); 145662306a36Sopenharmony_ci ret = qib_user_sdma_queue_clean(ppd, pq); 145762306a36Sopenharmony_ci mutex_unlock(&pq->lock); 145862306a36Sopenharmony_ci 145962306a36Sopenharmony_ci return ret; 146062306a36Sopenharmony_ci} 146162306a36Sopenharmony_ci 146262306a36Sopenharmony_ciu32 qib_user_sdma_complete_counter(const struct qib_user_sdma_queue *pq) 146362306a36Sopenharmony_ci{ 146462306a36Sopenharmony_ci return pq ? pq->sent_counter : 0; 146562306a36Sopenharmony_ci} 146662306a36Sopenharmony_ci 146762306a36Sopenharmony_ciu32 qib_user_sdma_inflight_counter(struct qib_user_sdma_queue *pq) 146862306a36Sopenharmony_ci{ 146962306a36Sopenharmony_ci return pq ? pq->counter : 0; 147062306a36Sopenharmony_ci} 1471