162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * This file is provided under a dual BSD/GPLv2 license. When using or 362306a36Sopenharmony_ci * redistributing this file, you may do so under either license. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * GPL LICENSE SUMMARY 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * Copyright(c) 2015 Intel Corporation. All rights reserved. 862306a36Sopenharmony_ci * Copyright(c) 2017 T-Platforms. All Rights Reserved. 962306a36Sopenharmony_ci * 1062306a36Sopenharmony_ci * This program is free software; you can redistribute it and/or modify 1162306a36Sopenharmony_ci * it under the terms of version 2 of the GNU General Public License as 1262306a36Sopenharmony_ci * published by the Free Software Foundation. 1362306a36Sopenharmony_ci * 1462306a36Sopenharmony_ci * BSD LICENSE 1562306a36Sopenharmony_ci * 1662306a36Sopenharmony_ci * Copyright(c) 2015 Intel Corporation. All rights reserved. 1762306a36Sopenharmony_ci * Copyright(c) 2017 T-Platforms. All Rights Reserved. 1862306a36Sopenharmony_ci * 1962306a36Sopenharmony_ci * Redistribution and use in source and binary forms, with or without 2062306a36Sopenharmony_ci * modification, are permitted provided that the following conditions 2162306a36Sopenharmony_ci * are met: 2262306a36Sopenharmony_ci * 2362306a36Sopenharmony_ci * * Redistributions of source code must retain the above copyright 2462306a36Sopenharmony_ci * notice, this list of conditions and the following disclaimer. 2562306a36Sopenharmony_ci * * Redistributions in binary form must reproduce the above copy 2662306a36Sopenharmony_ci * notice, this list of conditions and the following disclaimer in 2762306a36Sopenharmony_ci * the documentation and/or other materials provided with the 2862306a36Sopenharmony_ci * distribution. 2962306a36Sopenharmony_ci * * Neither the name of Intel Corporation nor the names of its 3062306a36Sopenharmony_ci * contributors may be used to endorse or promote products derived 3162306a36Sopenharmony_ci * from this software without specific prior written permission. 3262306a36Sopenharmony_ci * 3362306a36Sopenharmony_ci * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 3462306a36Sopenharmony_ci * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 3562306a36Sopenharmony_ci * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 3662306a36Sopenharmony_ci * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 3762306a36Sopenharmony_ci * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 3862306a36Sopenharmony_ci * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 3962306a36Sopenharmony_ci * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 4062306a36Sopenharmony_ci * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 4162306a36Sopenharmony_ci * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 4262306a36Sopenharmony_ci * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 4362306a36Sopenharmony_ci * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 4462306a36Sopenharmony_ci * 4562306a36Sopenharmony_ci * PCIe NTB Perf Linux driver 4662306a36Sopenharmony_ci */ 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci/* 4962306a36Sopenharmony_ci * How to use this tool, by example. 5062306a36Sopenharmony_ci * 5162306a36Sopenharmony_ci * Assuming $DBG_DIR is something like: 5262306a36Sopenharmony_ci * '/sys/kernel/debug/ntb_perf/0000:00:03.0' 5362306a36Sopenharmony_ci * Suppose aside from local device there is at least one remote device 5462306a36Sopenharmony_ci * connected to NTB with index 0. 5562306a36Sopenharmony_ci *----------------------------------------------------------------------------- 5662306a36Sopenharmony_ci * Eg: install driver with specified chunk/total orders and dma-enabled flag 5762306a36Sopenharmony_ci * 5862306a36Sopenharmony_ci * root@self# insmod ntb_perf.ko chunk_order=19 total_order=28 use_dma 5962306a36Sopenharmony_ci *----------------------------------------------------------------------------- 6062306a36Sopenharmony_ci * Eg: check NTB ports (index) and MW mapping information 6162306a36Sopenharmony_ci * 6262306a36Sopenharmony_ci * root@self# cat $DBG_DIR/info 6362306a36Sopenharmony_ci *----------------------------------------------------------------------------- 6462306a36Sopenharmony_ci * Eg: start performance test with peer (index 0) and get the test metrics 6562306a36Sopenharmony_ci * 6662306a36Sopenharmony_ci * root@self# echo 0 > $DBG_DIR/run 6762306a36Sopenharmony_ci * root@self# cat $DBG_DIR/run 6862306a36Sopenharmony_ci */ 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci#include <linux/init.h> 7162306a36Sopenharmony_ci#include <linux/kernel.h> 7262306a36Sopenharmony_ci#include <linux/module.h> 7362306a36Sopenharmony_ci#include <linux/sched.h> 7462306a36Sopenharmony_ci#include <linux/wait.h> 7562306a36Sopenharmony_ci#include <linux/dma-mapping.h> 7662306a36Sopenharmony_ci#include <linux/dmaengine.h> 7762306a36Sopenharmony_ci#include <linux/pci.h> 7862306a36Sopenharmony_ci#include <linux/ktime.h> 7962306a36Sopenharmony_ci#include <linux/slab.h> 8062306a36Sopenharmony_ci#include <linux/delay.h> 8162306a36Sopenharmony_ci#include <linux/sizes.h> 8262306a36Sopenharmony_ci#include <linux/workqueue.h> 8362306a36Sopenharmony_ci#include <linux/debugfs.h> 8462306a36Sopenharmony_ci#include <linux/random.h> 8562306a36Sopenharmony_ci#include <linux/ntb.h> 8662306a36Sopenharmony_ci 8762306a36Sopenharmony_ci#define DRIVER_NAME "ntb_perf" 8862306a36Sopenharmony_ci#define DRIVER_VERSION "2.0" 8962306a36Sopenharmony_ci 9062306a36Sopenharmony_ciMODULE_LICENSE("Dual BSD/GPL"); 9162306a36Sopenharmony_ciMODULE_VERSION(DRIVER_VERSION); 9262306a36Sopenharmony_ciMODULE_AUTHOR("Dave Jiang <dave.jiang@intel.com>"); 9362306a36Sopenharmony_ciMODULE_DESCRIPTION("PCIe NTB Performance Measurement Tool"); 9462306a36Sopenharmony_ci 9562306a36Sopenharmony_ci#define MAX_THREADS_CNT 32 9662306a36Sopenharmony_ci#define DEF_THREADS_CNT 1 9762306a36Sopenharmony_ci#define MAX_CHUNK_SIZE SZ_1M 9862306a36Sopenharmony_ci#define MAX_CHUNK_ORDER 20 /* no larger than 1M */ 9962306a36Sopenharmony_ci 10062306a36Sopenharmony_ci#define DMA_TRIES 100 10162306a36Sopenharmony_ci#define DMA_MDELAY 10 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_ci#define MSG_TRIES 1000 10462306a36Sopenharmony_ci#define MSG_UDELAY_LOW 1000000 10562306a36Sopenharmony_ci#define MSG_UDELAY_HIGH 2000000 10662306a36Sopenharmony_ci 10762306a36Sopenharmony_ci#define PERF_BUF_LEN 1024 10862306a36Sopenharmony_ci 10962306a36Sopenharmony_cistatic unsigned long max_mw_size; 11062306a36Sopenharmony_cimodule_param(max_mw_size, ulong, 0644); 11162306a36Sopenharmony_ciMODULE_PARM_DESC(max_mw_size, "Upper limit of memory window size"); 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_cistatic unsigned char chunk_order = 19; /* 512K */ 11462306a36Sopenharmony_cimodule_param(chunk_order, byte, 0644); 11562306a36Sopenharmony_ciMODULE_PARM_DESC(chunk_order, "Data chunk order [2^n] to transfer"); 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_cistatic unsigned char total_order = 30; /* 1G */ 11862306a36Sopenharmony_cimodule_param(total_order, byte, 0644); 11962306a36Sopenharmony_ciMODULE_PARM_DESC(total_order, "Total data order [2^n] to transfer"); 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_cistatic bool use_dma; /* default to 0 */ 12262306a36Sopenharmony_cimodule_param(use_dma, bool, 0644); 12362306a36Sopenharmony_ciMODULE_PARM_DESC(use_dma, "Use DMA engine to measure performance"); 12462306a36Sopenharmony_ci 12562306a36Sopenharmony_ci/*============================================================================== 12662306a36Sopenharmony_ci * Perf driver data definition 12762306a36Sopenharmony_ci *============================================================================== 12862306a36Sopenharmony_ci */ 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_cienum perf_cmd { 13162306a36Sopenharmony_ci PERF_CMD_INVAL = -1,/* invalid spad command */ 13262306a36Sopenharmony_ci PERF_CMD_SSIZE = 0, /* send out buffer size */ 13362306a36Sopenharmony_ci PERF_CMD_RSIZE = 1, /* recv in buffer size */ 13462306a36Sopenharmony_ci PERF_CMD_SXLAT = 2, /* send in buffer xlat */ 13562306a36Sopenharmony_ci PERF_CMD_RXLAT = 3, /* recv out buffer xlat */ 13662306a36Sopenharmony_ci PERF_CMD_CLEAR = 4, /* clear allocated memory */ 13762306a36Sopenharmony_ci PERF_STS_DONE = 5, /* init is done */ 13862306a36Sopenharmony_ci PERF_STS_LNKUP = 6, /* link up state flag */ 13962306a36Sopenharmony_ci}; 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_cistruct perf_ctx; 14262306a36Sopenharmony_ci 14362306a36Sopenharmony_cistruct perf_peer { 14462306a36Sopenharmony_ci struct perf_ctx *perf; 14562306a36Sopenharmony_ci int pidx; 14662306a36Sopenharmony_ci int gidx; 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_ci /* Outbound MW params */ 14962306a36Sopenharmony_ci u64 outbuf_xlat; 15062306a36Sopenharmony_ci resource_size_t outbuf_size; 15162306a36Sopenharmony_ci void __iomem *outbuf; 15262306a36Sopenharmony_ci phys_addr_t out_phys_addr; 15362306a36Sopenharmony_ci dma_addr_t dma_dst_addr; 15462306a36Sopenharmony_ci /* Inbound MW params */ 15562306a36Sopenharmony_ci dma_addr_t inbuf_xlat; 15662306a36Sopenharmony_ci resource_size_t inbuf_size; 15762306a36Sopenharmony_ci void *inbuf; 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_ci /* NTB connection setup service */ 16062306a36Sopenharmony_ci struct work_struct service; 16162306a36Sopenharmony_ci unsigned long sts; 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ci struct completion init_comp; 16462306a36Sopenharmony_ci}; 16562306a36Sopenharmony_ci#define to_peer_service(__work) \ 16662306a36Sopenharmony_ci container_of(__work, struct perf_peer, service) 16762306a36Sopenharmony_ci 16862306a36Sopenharmony_cistruct perf_thread { 16962306a36Sopenharmony_ci struct perf_ctx *perf; 17062306a36Sopenharmony_ci int tidx; 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_ci /* DMA-based test sync parameters */ 17362306a36Sopenharmony_ci atomic_t dma_sync; 17462306a36Sopenharmony_ci wait_queue_head_t dma_wait; 17562306a36Sopenharmony_ci struct dma_chan *dma_chan; 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci /* Data source and measured statistics */ 17862306a36Sopenharmony_ci void *src; 17962306a36Sopenharmony_ci u64 copied; 18062306a36Sopenharmony_ci ktime_t duration; 18162306a36Sopenharmony_ci int status; 18262306a36Sopenharmony_ci struct work_struct work; 18362306a36Sopenharmony_ci}; 18462306a36Sopenharmony_ci#define to_thread_work(__work) \ 18562306a36Sopenharmony_ci container_of(__work, struct perf_thread, work) 18662306a36Sopenharmony_ci 18762306a36Sopenharmony_cistruct perf_ctx { 18862306a36Sopenharmony_ci struct ntb_dev *ntb; 18962306a36Sopenharmony_ci 19062306a36Sopenharmony_ci /* Global device index and peers descriptors */ 19162306a36Sopenharmony_ci int gidx; 19262306a36Sopenharmony_ci int pcnt; 19362306a36Sopenharmony_ci struct perf_peer *peers; 19462306a36Sopenharmony_ci 19562306a36Sopenharmony_ci /* Performance measuring work-threads interface */ 19662306a36Sopenharmony_ci unsigned long busy_flag; 19762306a36Sopenharmony_ci wait_queue_head_t twait; 19862306a36Sopenharmony_ci atomic_t tsync; 19962306a36Sopenharmony_ci u8 tcnt; 20062306a36Sopenharmony_ci struct perf_peer *test_peer; 20162306a36Sopenharmony_ci struct perf_thread threads[MAX_THREADS_CNT]; 20262306a36Sopenharmony_ci 20362306a36Sopenharmony_ci /* Scratchpad/Message IO operations */ 20462306a36Sopenharmony_ci int (*cmd_send)(struct perf_peer *peer, enum perf_cmd cmd, u64 data); 20562306a36Sopenharmony_ci int (*cmd_recv)(struct perf_ctx *perf, int *pidx, enum perf_cmd *cmd, 20662306a36Sopenharmony_ci u64 *data); 20762306a36Sopenharmony_ci 20862306a36Sopenharmony_ci struct dentry *dbgfs_dir; 20962306a36Sopenharmony_ci}; 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci/* 21262306a36Sopenharmony_ci * Scratchpads-base commands interface 21362306a36Sopenharmony_ci */ 21462306a36Sopenharmony_ci#define PERF_SPAD_CNT(_pcnt) \ 21562306a36Sopenharmony_ci (3*((_pcnt) + 1)) 21662306a36Sopenharmony_ci#define PERF_SPAD_CMD(_gidx) \ 21762306a36Sopenharmony_ci (3*(_gidx)) 21862306a36Sopenharmony_ci#define PERF_SPAD_LDATA(_gidx) \ 21962306a36Sopenharmony_ci (3*(_gidx) + 1) 22062306a36Sopenharmony_ci#define PERF_SPAD_HDATA(_gidx) \ 22162306a36Sopenharmony_ci (3*(_gidx) + 2) 22262306a36Sopenharmony_ci#define PERF_SPAD_NOTIFY(_gidx) \ 22362306a36Sopenharmony_ci (BIT_ULL(_gidx)) 22462306a36Sopenharmony_ci 22562306a36Sopenharmony_ci/* 22662306a36Sopenharmony_ci * Messages-base commands interface 22762306a36Sopenharmony_ci */ 22862306a36Sopenharmony_ci#define PERF_MSG_CNT 3 22962306a36Sopenharmony_ci#define PERF_MSG_CMD 0 23062306a36Sopenharmony_ci#define PERF_MSG_LDATA 1 23162306a36Sopenharmony_ci#define PERF_MSG_HDATA 2 23262306a36Sopenharmony_ci 23362306a36Sopenharmony_ci/*============================================================================== 23462306a36Sopenharmony_ci * Static data declarations 23562306a36Sopenharmony_ci *============================================================================== 23662306a36Sopenharmony_ci */ 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_cistatic struct dentry *perf_dbgfs_topdir; 23962306a36Sopenharmony_ci 24062306a36Sopenharmony_cistatic struct workqueue_struct *perf_wq __read_mostly; 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_ci/*============================================================================== 24362306a36Sopenharmony_ci * NTB cross-link commands execution service 24462306a36Sopenharmony_ci *============================================================================== 24562306a36Sopenharmony_ci */ 24662306a36Sopenharmony_ci 24762306a36Sopenharmony_cistatic void perf_terminate_test(struct perf_ctx *perf); 24862306a36Sopenharmony_ci 24962306a36Sopenharmony_cistatic inline bool perf_link_is_up(struct perf_peer *peer) 25062306a36Sopenharmony_ci{ 25162306a36Sopenharmony_ci u64 link; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci link = ntb_link_is_up(peer->perf->ntb, NULL, NULL); 25462306a36Sopenharmony_ci return !!(link & BIT_ULL_MASK(peer->pidx)); 25562306a36Sopenharmony_ci} 25662306a36Sopenharmony_ci 25762306a36Sopenharmony_cistatic int perf_spad_cmd_send(struct perf_peer *peer, enum perf_cmd cmd, 25862306a36Sopenharmony_ci u64 data) 25962306a36Sopenharmony_ci{ 26062306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 26162306a36Sopenharmony_ci int try; 26262306a36Sopenharmony_ci u32 sts; 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "CMD send: %d 0x%llx\n", cmd, data); 26562306a36Sopenharmony_ci 26662306a36Sopenharmony_ci /* 26762306a36Sopenharmony_ci * Perform predefined number of attempts before give up. 26862306a36Sopenharmony_ci * We are sending the data to the port specific scratchpad, so 26962306a36Sopenharmony_ci * to prevent a multi-port access race-condition. Additionally 27062306a36Sopenharmony_ci * there is no need in local locking since only thread-safe 27162306a36Sopenharmony_ci * service work is using this method. 27262306a36Sopenharmony_ci */ 27362306a36Sopenharmony_ci for (try = 0; try < MSG_TRIES; try++) { 27462306a36Sopenharmony_ci if (!perf_link_is_up(peer)) 27562306a36Sopenharmony_ci return -ENOLINK; 27662306a36Sopenharmony_ci 27762306a36Sopenharmony_ci sts = ntb_peer_spad_read(perf->ntb, peer->pidx, 27862306a36Sopenharmony_ci PERF_SPAD_CMD(perf->gidx)); 27962306a36Sopenharmony_ci if (sts != PERF_CMD_INVAL) { 28062306a36Sopenharmony_ci usleep_range(MSG_UDELAY_LOW, MSG_UDELAY_HIGH); 28162306a36Sopenharmony_ci continue; 28262306a36Sopenharmony_ci } 28362306a36Sopenharmony_ci 28462306a36Sopenharmony_ci ntb_peer_spad_write(perf->ntb, peer->pidx, 28562306a36Sopenharmony_ci PERF_SPAD_LDATA(perf->gidx), 28662306a36Sopenharmony_ci lower_32_bits(data)); 28762306a36Sopenharmony_ci ntb_peer_spad_write(perf->ntb, peer->pidx, 28862306a36Sopenharmony_ci PERF_SPAD_HDATA(perf->gidx), 28962306a36Sopenharmony_ci upper_32_bits(data)); 29062306a36Sopenharmony_ci ntb_peer_spad_write(perf->ntb, peer->pidx, 29162306a36Sopenharmony_ci PERF_SPAD_CMD(perf->gidx), 29262306a36Sopenharmony_ci cmd); 29362306a36Sopenharmony_ci ntb_peer_db_set(perf->ntb, PERF_SPAD_NOTIFY(peer->gidx)); 29462306a36Sopenharmony_ci 29562306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "DB ring peer %#llx\n", 29662306a36Sopenharmony_ci PERF_SPAD_NOTIFY(peer->gidx)); 29762306a36Sopenharmony_ci 29862306a36Sopenharmony_ci break; 29962306a36Sopenharmony_ci } 30062306a36Sopenharmony_ci 30162306a36Sopenharmony_ci return try < MSG_TRIES ? 0 : -EAGAIN; 30262306a36Sopenharmony_ci} 30362306a36Sopenharmony_ci 30462306a36Sopenharmony_cistatic int perf_spad_cmd_recv(struct perf_ctx *perf, int *pidx, 30562306a36Sopenharmony_ci enum perf_cmd *cmd, u64 *data) 30662306a36Sopenharmony_ci{ 30762306a36Sopenharmony_ci struct perf_peer *peer; 30862306a36Sopenharmony_ci u32 val; 30962306a36Sopenharmony_ci 31062306a36Sopenharmony_ci ntb_db_clear(perf->ntb, PERF_SPAD_NOTIFY(perf->gidx)); 31162306a36Sopenharmony_ci 31262306a36Sopenharmony_ci /* 31362306a36Sopenharmony_ci * We start scanning all over, since cleared DB may have been set 31462306a36Sopenharmony_ci * by any peer. Yes, it makes peer with smaller index being 31562306a36Sopenharmony_ci * serviced with greater priority, but it's convenient for spad 31662306a36Sopenharmony_ci * and message code unification and simplicity. 31762306a36Sopenharmony_ci */ 31862306a36Sopenharmony_ci for (*pidx = 0; *pidx < perf->pcnt; (*pidx)++) { 31962306a36Sopenharmony_ci peer = &perf->peers[*pidx]; 32062306a36Sopenharmony_ci 32162306a36Sopenharmony_ci if (!perf_link_is_up(peer)) 32262306a36Sopenharmony_ci continue; 32362306a36Sopenharmony_ci 32462306a36Sopenharmony_ci val = ntb_spad_read(perf->ntb, PERF_SPAD_CMD(peer->gidx)); 32562306a36Sopenharmony_ci if (val == PERF_CMD_INVAL) 32662306a36Sopenharmony_ci continue; 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_ci *cmd = val; 32962306a36Sopenharmony_ci 33062306a36Sopenharmony_ci val = ntb_spad_read(perf->ntb, PERF_SPAD_LDATA(peer->gidx)); 33162306a36Sopenharmony_ci *data = val; 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_ci val = ntb_spad_read(perf->ntb, PERF_SPAD_HDATA(peer->gidx)); 33462306a36Sopenharmony_ci *data |= (u64)val << 32; 33562306a36Sopenharmony_ci 33662306a36Sopenharmony_ci /* Next command can be retrieved from now */ 33762306a36Sopenharmony_ci ntb_spad_write(perf->ntb, PERF_SPAD_CMD(peer->gidx), 33862306a36Sopenharmony_ci PERF_CMD_INVAL); 33962306a36Sopenharmony_ci 34062306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "CMD recv: %d 0x%llx\n", *cmd, *data); 34162306a36Sopenharmony_ci 34262306a36Sopenharmony_ci return 0; 34362306a36Sopenharmony_ci } 34462306a36Sopenharmony_ci 34562306a36Sopenharmony_ci return -ENODATA; 34662306a36Sopenharmony_ci} 34762306a36Sopenharmony_ci 34862306a36Sopenharmony_cistatic int perf_msg_cmd_send(struct perf_peer *peer, enum perf_cmd cmd, 34962306a36Sopenharmony_ci u64 data) 35062306a36Sopenharmony_ci{ 35162306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 35262306a36Sopenharmony_ci int try, ret; 35362306a36Sopenharmony_ci u64 outbits; 35462306a36Sopenharmony_ci 35562306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "CMD send: %d 0x%llx\n", cmd, data); 35662306a36Sopenharmony_ci 35762306a36Sopenharmony_ci /* 35862306a36Sopenharmony_ci * Perform predefined number of attempts before give up. Message 35962306a36Sopenharmony_ci * registers are free of race-condition problem when accessed 36062306a36Sopenharmony_ci * from different ports, so we don't need splitting registers 36162306a36Sopenharmony_ci * by global device index. We also won't have local locking, 36262306a36Sopenharmony_ci * since the method is used from service work only. 36362306a36Sopenharmony_ci */ 36462306a36Sopenharmony_ci outbits = ntb_msg_outbits(perf->ntb); 36562306a36Sopenharmony_ci for (try = 0; try < MSG_TRIES; try++) { 36662306a36Sopenharmony_ci if (!perf_link_is_up(peer)) 36762306a36Sopenharmony_ci return -ENOLINK; 36862306a36Sopenharmony_ci 36962306a36Sopenharmony_ci ret = ntb_msg_clear_sts(perf->ntb, outbits); 37062306a36Sopenharmony_ci if (ret) 37162306a36Sopenharmony_ci return ret; 37262306a36Sopenharmony_ci 37362306a36Sopenharmony_ci ntb_peer_msg_write(perf->ntb, peer->pidx, PERF_MSG_LDATA, 37462306a36Sopenharmony_ci lower_32_bits(data)); 37562306a36Sopenharmony_ci 37662306a36Sopenharmony_ci if (ntb_msg_read_sts(perf->ntb) & outbits) { 37762306a36Sopenharmony_ci usleep_range(MSG_UDELAY_LOW, MSG_UDELAY_HIGH); 37862306a36Sopenharmony_ci continue; 37962306a36Sopenharmony_ci } 38062306a36Sopenharmony_ci 38162306a36Sopenharmony_ci ntb_peer_msg_write(perf->ntb, peer->pidx, PERF_MSG_HDATA, 38262306a36Sopenharmony_ci upper_32_bits(data)); 38362306a36Sopenharmony_ci 38462306a36Sopenharmony_ci /* This call shall trigger peer message event */ 38562306a36Sopenharmony_ci ntb_peer_msg_write(perf->ntb, peer->pidx, PERF_MSG_CMD, cmd); 38662306a36Sopenharmony_ci 38762306a36Sopenharmony_ci break; 38862306a36Sopenharmony_ci } 38962306a36Sopenharmony_ci 39062306a36Sopenharmony_ci return try < MSG_TRIES ? 0 : -EAGAIN; 39162306a36Sopenharmony_ci} 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_cistatic int perf_msg_cmd_recv(struct perf_ctx *perf, int *pidx, 39462306a36Sopenharmony_ci enum perf_cmd *cmd, u64 *data) 39562306a36Sopenharmony_ci{ 39662306a36Sopenharmony_ci u64 inbits; 39762306a36Sopenharmony_ci u32 val; 39862306a36Sopenharmony_ci 39962306a36Sopenharmony_ci inbits = ntb_msg_inbits(perf->ntb); 40062306a36Sopenharmony_ci 40162306a36Sopenharmony_ci if (hweight64(ntb_msg_read_sts(perf->ntb) & inbits) < 3) 40262306a36Sopenharmony_ci return -ENODATA; 40362306a36Sopenharmony_ci 40462306a36Sopenharmony_ci val = ntb_msg_read(perf->ntb, pidx, PERF_MSG_CMD); 40562306a36Sopenharmony_ci *cmd = val; 40662306a36Sopenharmony_ci 40762306a36Sopenharmony_ci val = ntb_msg_read(perf->ntb, pidx, PERF_MSG_LDATA); 40862306a36Sopenharmony_ci *data = val; 40962306a36Sopenharmony_ci 41062306a36Sopenharmony_ci val = ntb_msg_read(perf->ntb, pidx, PERF_MSG_HDATA); 41162306a36Sopenharmony_ci *data |= (u64)val << 32; 41262306a36Sopenharmony_ci 41362306a36Sopenharmony_ci /* Next command can be retrieved from now */ 41462306a36Sopenharmony_ci ntb_msg_clear_sts(perf->ntb, inbits); 41562306a36Sopenharmony_ci 41662306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "CMD recv: %d 0x%llx\n", *cmd, *data); 41762306a36Sopenharmony_ci 41862306a36Sopenharmony_ci return 0; 41962306a36Sopenharmony_ci} 42062306a36Sopenharmony_ci 42162306a36Sopenharmony_cistatic int perf_cmd_send(struct perf_peer *peer, enum perf_cmd cmd, u64 data) 42262306a36Sopenharmony_ci{ 42362306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 42462306a36Sopenharmony_ci 42562306a36Sopenharmony_ci if (cmd == PERF_CMD_SSIZE || cmd == PERF_CMD_SXLAT) 42662306a36Sopenharmony_ci return perf->cmd_send(peer, cmd, data); 42762306a36Sopenharmony_ci 42862306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Send invalid command\n"); 42962306a36Sopenharmony_ci return -EINVAL; 43062306a36Sopenharmony_ci} 43162306a36Sopenharmony_ci 43262306a36Sopenharmony_cistatic int perf_cmd_exec(struct perf_peer *peer, enum perf_cmd cmd) 43362306a36Sopenharmony_ci{ 43462306a36Sopenharmony_ci switch (cmd) { 43562306a36Sopenharmony_ci case PERF_CMD_SSIZE: 43662306a36Sopenharmony_ci case PERF_CMD_RSIZE: 43762306a36Sopenharmony_ci case PERF_CMD_SXLAT: 43862306a36Sopenharmony_ci case PERF_CMD_RXLAT: 43962306a36Sopenharmony_ci case PERF_CMD_CLEAR: 44062306a36Sopenharmony_ci break; 44162306a36Sopenharmony_ci default: 44262306a36Sopenharmony_ci dev_err(&peer->perf->ntb->dev, "Exec invalid command\n"); 44362306a36Sopenharmony_ci return -EINVAL; 44462306a36Sopenharmony_ci } 44562306a36Sopenharmony_ci 44662306a36Sopenharmony_ci /* No need of memory barrier, since bit ops have invernal lock */ 44762306a36Sopenharmony_ci set_bit(cmd, &peer->sts); 44862306a36Sopenharmony_ci 44962306a36Sopenharmony_ci dev_dbg(&peer->perf->ntb->dev, "CMD exec: %d\n", cmd); 45062306a36Sopenharmony_ci 45162306a36Sopenharmony_ci (void)queue_work(system_highpri_wq, &peer->service); 45262306a36Sopenharmony_ci 45362306a36Sopenharmony_ci return 0; 45462306a36Sopenharmony_ci} 45562306a36Sopenharmony_ci 45662306a36Sopenharmony_cistatic int perf_cmd_recv(struct perf_ctx *perf) 45762306a36Sopenharmony_ci{ 45862306a36Sopenharmony_ci struct perf_peer *peer; 45962306a36Sopenharmony_ci int ret, pidx, cmd; 46062306a36Sopenharmony_ci u64 data; 46162306a36Sopenharmony_ci 46262306a36Sopenharmony_ci while (!(ret = perf->cmd_recv(perf, &pidx, &cmd, &data))) { 46362306a36Sopenharmony_ci peer = &perf->peers[pidx]; 46462306a36Sopenharmony_ci 46562306a36Sopenharmony_ci switch (cmd) { 46662306a36Sopenharmony_ci case PERF_CMD_SSIZE: 46762306a36Sopenharmony_ci peer->inbuf_size = data; 46862306a36Sopenharmony_ci return perf_cmd_exec(peer, PERF_CMD_RSIZE); 46962306a36Sopenharmony_ci case PERF_CMD_SXLAT: 47062306a36Sopenharmony_ci peer->outbuf_xlat = data; 47162306a36Sopenharmony_ci return perf_cmd_exec(peer, PERF_CMD_RXLAT); 47262306a36Sopenharmony_ci default: 47362306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Recv invalid command\n"); 47462306a36Sopenharmony_ci return -EINVAL; 47562306a36Sopenharmony_ci } 47662306a36Sopenharmony_ci } 47762306a36Sopenharmony_ci 47862306a36Sopenharmony_ci /* Return 0 if no data left to process, otherwise an error */ 47962306a36Sopenharmony_ci return ret == -ENODATA ? 0 : ret; 48062306a36Sopenharmony_ci} 48162306a36Sopenharmony_ci 48262306a36Sopenharmony_cistatic void perf_link_event(void *ctx) 48362306a36Sopenharmony_ci{ 48462306a36Sopenharmony_ci struct perf_ctx *perf = ctx; 48562306a36Sopenharmony_ci struct perf_peer *peer; 48662306a36Sopenharmony_ci bool lnk_up; 48762306a36Sopenharmony_ci int pidx; 48862306a36Sopenharmony_ci 48962306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) { 49062306a36Sopenharmony_ci peer = &perf->peers[pidx]; 49162306a36Sopenharmony_ci 49262306a36Sopenharmony_ci lnk_up = perf_link_is_up(peer); 49362306a36Sopenharmony_ci 49462306a36Sopenharmony_ci if (lnk_up && 49562306a36Sopenharmony_ci !test_and_set_bit(PERF_STS_LNKUP, &peer->sts)) { 49662306a36Sopenharmony_ci perf_cmd_exec(peer, PERF_CMD_SSIZE); 49762306a36Sopenharmony_ci } else if (!lnk_up && 49862306a36Sopenharmony_ci test_and_clear_bit(PERF_STS_LNKUP, &peer->sts)) { 49962306a36Sopenharmony_ci perf_cmd_exec(peer, PERF_CMD_CLEAR); 50062306a36Sopenharmony_ci } 50162306a36Sopenharmony_ci } 50262306a36Sopenharmony_ci} 50362306a36Sopenharmony_ci 50462306a36Sopenharmony_cistatic void perf_db_event(void *ctx, int vec) 50562306a36Sopenharmony_ci{ 50662306a36Sopenharmony_ci struct perf_ctx *perf = ctx; 50762306a36Sopenharmony_ci 50862306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "DB vec %d mask %#llx bits %#llx\n", vec, 50962306a36Sopenharmony_ci ntb_db_vector_mask(perf->ntb, vec), ntb_db_read(perf->ntb)); 51062306a36Sopenharmony_ci 51162306a36Sopenharmony_ci /* Just receive all available commands */ 51262306a36Sopenharmony_ci (void)perf_cmd_recv(perf); 51362306a36Sopenharmony_ci} 51462306a36Sopenharmony_ci 51562306a36Sopenharmony_cistatic void perf_msg_event(void *ctx) 51662306a36Sopenharmony_ci{ 51762306a36Sopenharmony_ci struct perf_ctx *perf = ctx; 51862306a36Sopenharmony_ci 51962306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Msg status bits %#llx\n", 52062306a36Sopenharmony_ci ntb_msg_read_sts(perf->ntb)); 52162306a36Sopenharmony_ci 52262306a36Sopenharmony_ci /* Messages are only sent one-by-one */ 52362306a36Sopenharmony_ci (void)perf_cmd_recv(perf); 52462306a36Sopenharmony_ci} 52562306a36Sopenharmony_ci 52662306a36Sopenharmony_cistatic const struct ntb_ctx_ops perf_ops = { 52762306a36Sopenharmony_ci .link_event = perf_link_event, 52862306a36Sopenharmony_ci .db_event = perf_db_event, 52962306a36Sopenharmony_ci .msg_event = perf_msg_event 53062306a36Sopenharmony_ci}; 53162306a36Sopenharmony_ci 53262306a36Sopenharmony_cistatic void perf_free_outbuf(struct perf_peer *peer) 53362306a36Sopenharmony_ci{ 53462306a36Sopenharmony_ci (void)ntb_peer_mw_clear_trans(peer->perf->ntb, peer->pidx, peer->gidx); 53562306a36Sopenharmony_ci} 53662306a36Sopenharmony_ci 53762306a36Sopenharmony_cistatic int perf_setup_outbuf(struct perf_peer *peer) 53862306a36Sopenharmony_ci{ 53962306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 54062306a36Sopenharmony_ci int ret; 54162306a36Sopenharmony_ci 54262306a36Sopenharmony_ci /* Outbuf size can be unaligned due to custom max_mw_size */ 54362306a36Sopenharmony_ci ret = ntb_peer_mw_set_trans(perf->ntb, peer->pidx, peer->gidx, 54462306a36Sopenharmony_ci peer->outbuf_xlat, peer->outbuf_size); 54562306a36Sopenharmony_ci if (ret) { 54662306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Failed to set outbuf translation\n"); 54762306a36Sopenharmony_ci return ret; 54862306a36Sopenharmony_ci } 54962306a36Sopenharmony_ci 55062306a36Sopenharmony_ci /* Initialization is finally done */ 55162306a36Sopenharmony_ci set_bit(PERF_STS_DONE, &peer->sts); 55262306a36Sopenharmony_ci complete_all(&peer->init_comp); 55362306a36Sopenharmony_ci 55462306a36Sopenharmony_ci return 0; 55562306a36Sopenharmony_ci} 55662306a36Sopenharmony_ci 55762306a36Sopenharmony_cistatic void perf_free_inbuf(struct perf_peer *peer) 55862306a36Sopenharmony_ci{ 55962306a36Sopenharmony_ci if (!peer->inbuf) 56062306a36Sopenharmony_ci return; 56162306a36Sopenharmony_ci 56262306a36Sopenharmony_ci (void)ntb_mw_clear_trans(peer->perf->ntb, peer->pidx, peer->gidx); 56362306a36Sopenharmony_ci dma_free_coherent(&peer->perf->ntb->pdev->dev, peer->inbuf_size, 56462306a36Sopenharmony_ci peer->inbuf, peer->inbuf_xlat); 56562306a36Sopenharmony_ci peer->inbuf = NULL; 56662306a36Sopenharmony_ci} 56762306a36Sopenharmony_ci 56862306a36Sopenharmony_cistatic int perf_setup_inbuf(struct perf_peer *peer) 56962306a36Sopenharmony_ci{ 57062306a36Sopenharmony_ci resource_size_t xlat_align, size_align, size_max; 57162306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 57262306a36Sopenharmony_ci int ret; 57362306a36Sopenharmony_ci 57462306a36Sopenharmony_ci /* Get inbound MW parameters */ 57562306a36Sopenharmony_ci ret = ntb_mw_get_align(perf->ntb, peer->pidx, perf->gidx, 57662306a36Sopenharmony_ci &xlat_align, &size_align, &size_max); 57762306a36Sopenharmony_ci if (ret) { 57862306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Couldn't get inbuf restrictions\n"); 57962306a36Sopenharmony_ci return ret; 58062306a36Sopenharmony_ci } 58162306a36Sopenharmony_ci 58262306a36Sopenharmony_ci if (peer->inbuf_size > size_max) { 58362306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Too big inbuf size %pa > %pa\n", 58462306a36Sopenharmony_ci &peer->inbuf_size, &size_max); 58562306a36Sopenharmony_ci return -EINVAL; 58662306a36Sopenharmony_ci } 58762306a36Sopenharmony_ci 58862306a36Sopenharmony_ci peer->inbuf_size = round_up(peer->inbuf_size, size_align); 58962306a36Sopenharmony_ci 59062306a36Sopenharmony_ci perf_free_inbuf(peer); 59162306a36Sopenharmony_ci 59262306a36Sopenharmony_ci peer->inbuf = dma_alloc_coherent(&perf->ntb->pdev->dev, 59362306a36Sopenharmony_ci peer->inbuf_size, &peer->inbuf_xlat, 59462306a36Sopenharmony_ci GFP_KERNEL); 59562306a36Sopenharmony_ci if (!peer->inbuf) { 59662306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Failed to alloc inbuf of %pa\n", 59762306a36Sopenharmony_ci &peer->inbuf_size); 59862306a36Sopenharmony_ci return -ENOMEM; 59962306a36Sopenharmony_ci } 60062306a36Sopenharmony_ci if (!IS_ALIGNED(peer->inbuf_xlat, xlat_align)) { 60162306a36Sopenharmony_ci ret = -EINVAL; 60262306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Unaligned inbuf allocated\n"); 60362306a36Sopenharmony_ci goto err_free_inbuf; 60462306a36Sopenharmony_ci } 60562306a36Sopenharmony_ci 60662306a36Sopenharmony_ci ret = ntb_mw_set_trans(perf->ntb, peer->pidx, peer->gidx, 60762306a36Sopenharmony_ci peer->inbuf_xlat, peer->inbuf_size); 60862306a36Sopenharmony_ci if (ret) { 60962306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Failed to set inbuf translation\n"); 61062306a36Sopenharmony_ci goto err_free_inbuf; 61162306a36Sopenharmony_ci } 61262306a36Sopenharmony_ci 61362306a36Sopenharmony_ci /* 61462306a36Sopenharmony_ci * We submit inbuf xlat transmission cmd for execution here to follow 61562306a36Sopenharmony_ci * the code architecture, even though this method is called from service 61662306a36Sopenharmony_ci * work itself so the command will be executed right after it returns. 61762306a36Sopenharmony_ci */ 61862306a36Sopenharmony_ci (void)perf_cmd_exec(peer, PERF_CMD_SXLAT); 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_ci return 0; 62162306a36Sopenharmony_ci 62262306a36Sopenharmony_cierr_free_inbuf: 62362306a36Sopenharmony_ci perf_free_inbuf(peer); 62462306a36Sopenharmony_ci 62562306a36Sopenharmony_ci return ret; 62662306a36Sopenharmony_ci} 62762306a36Sopenharmony_ci 62862306a36Sopenharmony_cistatic void perf_service_work(struct work_struct *work) 62962306a36Sopenharmony_ci{ 63062306a36Sopenharmony_ci struct perf_peer *peer = to_peer_service(work); 63162306a36Sopenharmony_ci 63262306a36Sopenharmony_ci if (test_and_clear_bit(PERF_CMD_SSIZE, &peer->sts)) 63362306a36Sopenharmony_ci perf_cmd_send(peer, PERF_CMD_SSIZE, peer->outbuf_size); 63462306a36Sopenharmony_ci 63562306a36Sopenharmony_ci if (test_and_clear_bit(PERF_CMD_RSIZE, &peer->sts)) 63662306a36Sopenharmony_ci perf_setup_inbuf(peer); 63762306a36Sopenharmony_ci 63862306a36Sopenharmony_ci if (test_and_clear_bit(PERF_CMD_SXLAT, &peer->sts)) 63962306a36Sopenharmony_ci perf_cmd_send(peer, PERF_CMD_SXLAT, peer->inbuf_xlat); 64062306a36Sopenharmony_ci 64162306a36Sopenharmony_ci if (test_and_clear_bit(PERF_CMD_RXLAT, &peer->sts)) 64262306a36Sopenharmony_ci perf_setup_outbuf(peer); 64362306a36Sopenharmony_ci 64462306a36Sopenharmony_ci if (test_and_clear_bit(PERF_CMD_CLEAR, &peer->sts)) { 64562306a36Sopenharmony_ci init_completion(&peer->init_comp); 64662306a36Sopenharmony_ci clear_bit(PERF_STS_DONE, &peer->sts); 64762306a36Sopenharmony_ci if (test_bit(0, &peer->perf->busy_flag) && 64862306a36Sopenharmony_ci peer == peer->perf->test_peer) { 64962306a36Sopenharmony_ci dev_warn(&peer->perf->ntb->dev, 65062306a36Sopenharmony_ci "Freeing while test on-fly\n"); 65162306a36Sopenharmony_ci perf_terminate_test(peer->perf); 65262306a36Sopenharmony_ci } 65362306a36Sopenharmony_ci perf_free_outbuf(peer); 65462306a36Sopenharmony_ci perf_free_inbuf(peer); 65562306a36Sopenharmony_ci } 65662306a36Sopenharmony_ci} 65762306a36Sopenharmony_ci 65862306a36Sopenharmony_cistatic int perf_init_service(struct perf_ctx *perf) 65962306a36Sopenharmony_ci{ 66062306a36Sopenharmony_ci u64 mask; 66162306a36Sopenharmony_ci 66262306a36Sopenharmony_ci if (ntb_peer_mw_count(perf->ntb) < perf->pcnt) { 66362306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Not enough memory windows\n"); 66462306a36Sopenharmony_ci return -EINVAL; 66562306a36Sopenharmony_ci } 66662306a36Sopenharmony_ci 66762306a36Sopenharmony_ci if (ntb_msg_count(perf->ntb) >= PERF_MSG_CNT) { 66862306a36Sopenharmony_ci perf->cmd_send = perf_msg_cmd_send; 66962306a36Sopenharmony_ci perf->cmd_recv = perf_msg_cmd_recv; 67062306a36Sopenharmony_ci 67162306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Message service initialized\n"); 67262306a36Sopenharmony_ci 67362306a36Sopenharmony_ci return 0; 67462306a36Sopenharmony_ci } 67562306a36Sopenharmony_ci 67662306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Message service unsupported\n"); 67762306a36Sopenharmony_ci 67862306a36Sopenharmony_ci mask = GENMASK_ULL(perf->pcnt, 0); 67962306a36Sopenharmony_ci if (ntb_spad_count(perf->ntb) >= PERF_SPAD_CNT(perf->pcnt) && 68062306a36Sopenharmony_ci (ntb_db_valid_mask(perf->ntb) & mask) == mask) { 68162306a36Sopenharmony_ci perf->cmd_send = perf_spad_cmd_send; 68262306a36Sopenharmony_ci perf->cmd_recv = perf_spad_cmd_recv; 68362306a36Sopenharmony_ci 68462306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Scratchpad service initialized\n"); 68562306a36Sopenharmony_ci 68662306a36Sopenharmony_ci return 0; 68762306a36Sopenharmony_ci } 68862306a36Sopenharmony_ci 68962306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Scratchpad service unsupported\n"); 69062306a36Sopenharmony_ci 69162306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "Command services unsupported\n"); 69262306a36Sopenharmony_ci 69362306a36Sopenharmony_ci return -EINVAL; 69462306a36Sopenharmony_ci} 69562306a36Sopenharmony_ci 69662306a36Sopenharmony_cistatic int perf_enable_service(struct perf_ctx *perf) 69762306a36Sopenharmony_ci{ 69862306a36Sopenharmony_ci u64 mask, incmd_bit; 69962306a36Sopenharmony_ci int ret, sidx, scnt; 70062306a36Sopenharmony_ci 70162306a36Sopenharmony_ci mask = ntb_db_valid_mask(perf->ntb); 70262306a36Sopenharmony_ci (void)ntb_db_set_mask(perf->ntb, mask); 70362306a36Sopenharmony_ci 70462306a36Sopenharmony_ci ret = ntb_set_ctx(perf->ntb, perf, &perf_ops); 70562306a36Sopenharmony_ci if (ret) 70662306a36Sopenharmony_ci return ret; 70762306a36Sopenharmony_ci 70862306a36Sopenharmony_ci if (perf->cmd_send == perf_msg_cmd_send) { 70962306a36Sopenharmony_ci u64 inbits, outbits; 71062306a36Sopenharmony_ci 71162306a36Sopenharmony_ci inbits = ntb_msg_inbits(perf->ntb); 71262306a36Sopenharmony_ci outbits = ntb_msg_outbits(perf->ntb); 71362306a36Sopenharmony_ci (void)ntb_msg_set_mask(perf->ntb, inbits | outbits); 71462306a36Sopenharmony_ci 71562306a36Sopenharmony_ci incmd_bit = BIT_ULL(__ffs64(inbits)); 71662306a36Sopenharmony_ci ret = ntb_msg_clear_mask(perf->ntb, incmd_bit); 71762306a36Sopenharmony_ci 71862306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "MSG sts unmasked %#llx\n", incmd_bit); 71962306a36Sopenharmony_ci } else { 72062306a36Sopenharmony_ci scnt = ntb_spad_count(perf->ntb); 72162306a36Sopenharmony_ci for (sidx = 0; sidx < scnt; sidx++) 72262306a36Sopenharmony_ci ntb_spad_write(perf->ntb, sidx, PERF_CMD_INVAL); 72362306a36Sopenharmony_ci incmd_bit = PERF_SPAD_NOTIFY(perf->gidx); 72462306a36Sopenharmony_ci ret = ntb_db_clear_mask(perf->ntb, incmd_bit); 72562306a36Sopenharmony_ci 72662306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "DB bits unmasked %#llx\n", incmd_bit); 72762306a36Sopenharmony_ci } 72862306a36Sopenharmony_ci if (ret) { 72962306a36Sopenharmony_ci ntb_clear_ctx(perf->ntb); 73062306a36Sopenharmony_ci return ret; 73162306a36Sopenharmony_ci } 73262306a36Sopenharmony_ci 73362306a36Sopenharmony_ci ntb_link_enable(perf->ntb, NTB_SPEED_AUTO, NTB_WIDTH_AUTO); 73462306a36Sopenharmony_ci /* Might be not necessary */ 73562306a36Sopenharmony_ci ntb_link_event(perf->ntb); 73662306a36Sopenharmony_ci 73762306a36Sopenharmony_ci return 0; 73862306a36Sopenharmony_ci} 73962306a36Sopenharmony_ci 74062306a36Sopenharmony_cistatic void perf_disable_service(struct perf_ctx *perf) 74162306a36Sopenharmony_ci{ 74262306a36Sopenharmony_ci int pidx; 74362306a36Sopenharmony_ci 74462306a36Sopenharmony_ci if (perf->cmd_send == perf_msg_cmd_send) { 74562306a36Sopenharmony_ci u64 inbits; 74662306a36Sopenharmony_ci 74762306a36Sopenharmony_ci inbits = ntb_msg_inbits(perf->ntb); 74862306a36Sopenharmony_ci (void)ntb_msg_set_mask(perf->ntb, inbits); 74962306a36Sopenharmony_ci } else { 75062306a36Sopenharmony_ci (void)ntb_db_set_mask(perf->ntb, PERF_SPAD_NOTIFY(perf->gidx)); 75162306a36Sopenharmony_ci } 75262306a36Sopenharmony_ci 75362306a36Sopenharmony_ci ntb_clear_ctx(perf->ntb); 75462306a36Sopenharmony_ci 75562306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) 75662306a36Sopenharmony_ci perf_cmd_exec(&perf->peers[pidx], PERF_CMD_CLEAR); 75762306a36Sopenharmony_ci 75862306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) 75962306a36Sopenharmony_ci flush_work(&perf->peers[pidx].service); 76062306a36Sopenharmony_ci 76162306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) { 76262306a36Sopenharmony_ci struct perf_peer *peer = &perf->peers[pidx]; 76362306a36Sopenharmony_ci 76462306a36Sopenharmony_ci ntb_spad_write(perf->ntb, PERF_SPAD_CMD(peer->gidx), 0); 76562306a36Sopenharmony_ci } 76662306a36Sopenharmony_ci 76762306a36Sopenharmony_ci ntb_db_clear(perf->ntb, PERF_SPAD_NOTIFY(perf->gidx)); 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_ci ntb_link_disable(perf->ntb); 77062306a36Sopenharmony_ci} 77162306a36Sopenharmony_ci 77262306a36Sopenharmony_ci/*============================================================================== 77362306a36Sopenharmony_ci * Performance measuring work-thread 77462306a36Sopenharmony_ci *============================================================================== 77562306a36Sopenharmony_ci */ 77662306a36Sopenharmony_ci 77762306a36Sopenharmony_cistatic void perf_dma_copy_callback(void *data) 77862306a36Sopenharmony_ci{ 77962306a36Sopenharmony_ci struct perf_thread *pthr = data; 78062306a36Sopenharmony_ci 78162306a36Sopenharmony_ci atomic_dec(&pthr->dma_sync); 78262306a36Sopenharmony_ci wake_up(&pthr->dma_wait); 78362306a36Sopenharmony_ci} 78462306a36Sopenharmony_ci 78562306a36Sopenharmony_cistatic int perf_copy_chunk(struct perf_thread *pthr, 78662306a36Sopenharmony_ci void __iomem *dst, void *src, size_t len) 78762306a36Sopenharmony_ci{ 78862306a36Sopenharmony_ci struct dma_async_tx_descriptor *tx; 78962306a36Sopenharmony_ci struct dmaengine_unmap_data *unmap; 79062306a36Sopenharmony_ci struct device *dma_dev; 79162306a36Sopenharmony_ci int try = 0, ret = 0; 79262306a36Sopenharmony_ci struct perf_peer *peer = pthr->perf->test_peer; 79362306a36Sopenharmony_ci void __iomem *vbase; 79462306a36Sopenharmony_ci void __iomem *dst_vaddr; 79562306a36Sopenharmony_ci dma_addr_t dst_dma_addr; 79662306a36Sopenharmony_ci 79762306a36Sopenharmony_ci if (!use_dma) { 79862306a36Sopenharmony_ci memcpy_toio(dst, src, len); 79962306a36Sopenharmony_ci goto ret_check_tsync; 80062306a36Sopenharmony_ci } 80162306a36Sopenharmony_ci 80262306a36Sopenharmony_ci dma_dev = pthr->dma_chan->device->dev; 80362306a36Sopenharmony_ci 80462306a36Sopenharmony_ci if (!is_dma_copy_aligned(pthr->dma_chan->device, offset_in_page(src), 80562306a36Sopenharmony_ci offset_in_page(dst), len)) 80662306a36Sopenharmony_ci return -EIO; 80762306a36Sopenharmony_ci 80862306a36Sopenharmony_ci vbase = peer->outbuf; 80962306a36Sopenharmony_ci dst_vaddr = dst; 81062306a36Sopenharmony_ci dst_dma_addr = peer->dma_dst_addr + (dst_vaddr - vbase); 81162306a36Sopenharmony_ci 81262306a36Sopenharmony_ci unmap = dmaengine_get_unmap_data(dma_dev, 1, GFP_NOWAIT); 81362306a36Sopenharmony_ci if (!unmap) 81462306a36Sopenharmony_ci return -ENOMEM; 81562306a36Sopenharmony_ci 81662306a36Sopenharmony_ci unmap->len = len; 81762306a36Sopenharmony_ci unmap->addr[0] = dma_map_page(dma_dev, virt_to_page(src), 81862306a36Sopenharmony_ci offset_in_page(src), len, DMA_TO_DEVICE); 81962306a36Sopenharmony_ci if (dma_mapping_error(dma_dev, unmap->addr[0])) { 82062306a36Sopenharmony_ci ret = -EIO; 82162306a36Sopenharmony_ci goto err_free_resource; 82262306a36Sopenharmony_ci } 82362306a36Sopenharmony_ci unmap->to_cnt = 1; 82462306a36Sopenharmony_ci 82562306a36Sopenharmony_ci do { 82662306a36Sopenharmony_ci tx = dmaengine_prep_dma_memcpy(pthr->dma_chan, dst_dma_addr, 82762306a36Sopenharmony_ci unmap->addr[0], len, DMA_PREP_INTERRUPT | DMA_CTRL_ACK); 82862306a36Sopenharmony_ci if (!tx) 82962306a36Sopenharmony_ci msleep(DMA_MDELAY); 83062306a36Sopenharmony_ci } while (!tx && (try++ < DMA_TRIES)); 83162306a36Sopenharmony_ci 83262306a36Sopenharmony_ci if (!tx) { 83362306a36Sopenharmony_ci ret = -EIO; 83462306a36Sopenharmony_ci goto err_free_resource; 83562306a36Sopenharmony_ci } 83662306a36Sopenharmony_ci 83762306a36Sopenharmony_ci tx->callback = perf_dma_copy_callback; 83862306a36Sopenharmony_ci tx->callback_param = pthr; 83962306a36Sopenharmony_ci dma_set_unmap(tx, unmap); 84062306a36Sopenharmony_ci 84162306a36Sopenharmony_ci ret = dma_submit_error(dmaengine_submit(tx)); 84262306a36Sopenharmony_ci if (ret) { 84362306a36Sopenharmony_ci dmaengine_unmap_put(unmap); 84462306a36Sopenharmony_ci goto err_free_resource; 84562306a36Sopenharmony_ci } 84662306a36Sopenharmony_ci 84762306a36Sopenharmony_ci dmaengine_unmap_put(unmap); 84862306a36Sopenharmony_ci 84962306a36Sopenharmony_ci atomic_inc(&pthr->dma_sync); 85062306a36Sopenharmony_ci dma_async_issue_pending(pthr->dma_chan); 85162306a36Sopenharmony_ci 85262306a36Sopenharmony_ciret_check_tsync: 85362306a36Sopenharmony_ci return likely(atomic_read(&pthr->perf->tsync) > 0) ? 0 : -EINTR; 85462306a36Sopenharmony_ci 85562306a36Sopenharmony_cierr_free_resource: 85662306a36Sopenharmony_ci dmaengine_unmap_put(unmap); 85762306a36Sopenharmony_ci 85862306a36Sopenharmony_ci return ret; 85962306a36Sopenharmony_ci} 86062306a36Sopenharmony_ci 86162306a36Sopenharmony_cistatic bool perf_dma_filter(struct dma_chan *chan, void *data) 86262306a36Sopenharmony_ci{ 86362306a36Sopenharmony_ci struct perf_ctx *perf = data; 86462306a36Sopenharmony_ci int node; 86562306a36Sopenharmony_ci 86662306a36Sopenharmony_ci node = dev_to_node(&perf->ntb->dev); 86762306a36Sopenharmony_ci 86862306a36Sopenharmony_ci return node == NUMA_NO_NODE || node == dev_to_node(chan->device->dev); 86962306a36Sopenharmony_ci} 87062306a36Sopenharmony_ci 87162306a36Sopenharmony_cistatic int perf_init_test(struct perf_thread *pthr) 87262306a36Sopenharmony_ci{ 87362306a36Sopenharmony_ci struct perf_ctx *perf = pthr->perf; 87462306a36Sopenharmony_ci dma_cap_mask_t dma_mask; 87562306a36Sopenharmony_ci struct perf_peer *peer = pthr->perf->test_peer; 87662306a36Sopenharmony_ci 87762306a36Sopenharmony_ci pthr->src = kmalloc_node(perf->test_peer->outbuf_size, GFP_KERNEL, 87862306a36Sopenharmony_ci dev_to_node(&perf->ntb->dev)); 87962306a36Sopenharmony_ci if (!pthr->src) 88062306a36Sopenharmony_ci return -ENOMEM; 88162306a36Sopenharmony_ci 88262306a36Sopenharmony_ci get_random_bytes(pthr->src, perf->test_peer->outbuf_size); 88362306a36Sopenharmony_ci 88462306a36Sopenharmony_ci if (!use_dma) 88562306a36Sopenharmony_ci return 0; 88662306a36Sopenharmony_ci 88762306a36Sopenharmony_ci dma_cap_zero(dma_mask); 88862306a36Sopenharmony_ci dma_cap_set(DMA_MEMCPY, dma_mask); 88962306a36Sopenharmony_ci pthr->dma_chan = dma_request_channel(dma_mask, perf_dma_filter, perf); 89062306a36Sopenharmony_ci if (!pthr->dma_chan) { 89162306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "%d: Failed to get DMA channel\n", 89262306a36Sopenharmony_ci pthr->tidx); 89362306a36Sopenharmony_ci goto err_free; 89462306a36Sopenharmony_ci } 89562306a36Sopenharmony_ci peer->dma_dst_addr = 89662306a36Sopenharmony_ci dma_map_resource(pthr->dma_chan->device->dev, 89762306a36Sopenharmony_ci peer->out_phys_addr, peer->outbuf_size, 89862306a36Sopenharmony_ci DMA_FROM_DEVICE, 0); 89962306a36Sopenharmony_ci if (dma_mapping_error(pthr->dma_chan->device->dev, 90062306a36Sopenharmony_ci peer->dma_dst_addr)) { 90162306a36Sopenharmony_ci dev_err(pthr->dma_chan->device->dev, "%d: Failed to map DMA addr\n", 90262306a36Sopenharmony_ci pthr->tidx); 90362306a36Sopenharmony_ci peer->dma_dst_addr = 0; 90462306a36Sopenharmony_ci dma_release_channel(pthr->dma_chan); 90562306a36Sopenharmony_ci goto err_free; 90662306a36Sopenharmony_ci } 90762306a36Sopenharmony_ci dev_dbg(pthr->dma_chan->device->dev, "%d: Map MMIO %pa to DMA addr %pad\n", 90862306a36Sopenharmony_ci pthr->tidx, 90962306a36Sopenharmony_ci &peer->out_phys_addr, 91062306a36Sopenharmony_ci &peer->dma_dst_addr); 91162306a36Sopenharmony_ci 91262306a36Sopenharmony_ci atomic_set(&pthr->dma_sync, 0); 91362306a36Sopenharmony_ci return 0; 91462306a36Sopenharmony_ci 91562306a36Sopenharmony_cierr_free: 91662306a36Sopenharmony_ci atomic_dec(&perf->tsync); 91762306a36Sopenharmony_ci wake_up(&perf->twait); 91862306a36Sopenharmony_ci kfree(pthr->src); 91962306a36Sopenharmony_ci return -ENODEV; 92062306a36Sopenharmony_ci} 92162306a36Sopenharmony_ci 92262306a36Sopenharmony_cistatic int perf_run_test(struct perf_thread *pthr) 92362306a36Sopenharmony_ci{ 92462306a36Sopenharmony_ci struct perf_peer *peer = pthr->perf->test_peer; 92562306a36Sopenharmony_ci struct perf_ctx *perf = pthr->perf; 92662306a36Sopenharmony_ci void __iomem *flt_dst, *bnd_dst; 92762306a36Sopenharmony_ci u64 total_size, chunk_size; 92862306a36Sopenharmony_ci void *flt_src; 92962306a36Sopenharmony_ci int ret = 0; 93062306a36Sopenharmony_ci 93162306a36Sopenharmony_ci total_size = 1ULL << total_order; 93262306a36Sopenharmony_ci chunk_size = 1ULL << chunk_order; 93362306a36Sopenharmony_ci chunk_size = min_t(u64, peer->outbuf_size, chunk_size); 93462306a36Sopenharmony_ci 93562306a36Sopenharmony_ci flt_src = pthr->src; 93662306a36Sopenharmony_ci bnd_dst = peer->outbuf + peer->outbuf_size; 93762306a36Sopenharmony_ci flt_dst = peer->outbuf; 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_ci pthr->duration = ktime_get(); 94062306a36Sopenharmony_ci 94162306a36Sopenharmony_ci /* Copied field is cleared on test launch stage */ 94262306a36Sopenharmony_ci while (pthr->copied < total_size) { 94362306a36Sopenharmony_ci ret = perf_copy_chunk(pthr, flt_dst, flt_src, chunk_size); 94462306a36Sopenharmony_ci if (ret) { 94562306a36Sopenharmony_ci dev_err(&perf->ntb->dev, "%d: Got error %d on test\n", 94662306a36Sopenharmony_ci pthr->tidx, ret); 94762306a36Sopenharmony_ci return ret; 94862306a36Sopenharmony_ci } 94962306a36Sopenharmony_ci 95062306a36Sopenharmony_ci pthr->copied += chunk_size; 95162306a36Sopenharmony_ci 95262306a36Sopenharmony_ci flt_dst += chunk_size; 95362306a36Sopenharmony_ci flt_src += chunk_size; 95462306a36Sopenharmony_ci if (flt_dst >= bnd_dst || flt_dst < peer->outbuf) { 95562306a36Sopenharmony_ci flt_dst = peer->outbuf; 95662306a36Sopenharmony_ci flt_src = pthr->src; 95762306a36Sopenharmony_ci } 95862306a36Sopenharmony_ci 95962306a36Sopenharmony_ci /* Give up CPU to give a chance for other threads to use it */ 96062306a36Sopenharmony_ci schedule(); 96162306a36Sopenharmony_ci } 96262306a36Sopenharmony_ci 96362306a36Sopenharmony_ci return 0; 96462306a36Sopenharmony_ci} 96562306a36Sopenharmony_ci 96662306a36Sopenharmony_cistatic int perf_sync_test(struct perf_thread *pthr) 96762306a36Sopenharmony_ci{ 96862306a36Sopenharmony_ci struct perf_ctx *perf = pthr->perf; 96962306a36Sopenharmony_ci 97062306a36Sopenharmony_ci if (!use_dma) 97162306a36Sopenharmony_ci goto no_dma_ret; 97262306a36Sopenharmony_ci 97362306a36Sopenharmony_ci wait_event(pthr->dma_wait, 97462306a36Sopenharmony_ci (atomic_read(&pthr->dma_sync) == 0 || 97562306a36Sopenharmony_ci atomic_read(&perf->tsync) < 0)); 97662306a36Sopenharmony_ci 97762306a36Sopenharmony_ci if (atomic_read(&perf->tsync) < 0) 97862306a36Sopenharmony_ci return -EINTR; 97962306a36Sopenharmony_ci 98062306a36Sopenharmony_cino_dma_ret: 98162306a36Sopenharmony_ci pthr->duration = ktime_sub(ktime_get(), pthr->duration); 98262306a36Sopenharmony_ci 98362306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "%d: copied %llu bytes\n", 98462306a36Sopenharmony_ci pthr->tidx, pthr->copied); 98562306a36Sopenharmony_ci 98662306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "%d: lasted %llu usecs\n", 98762306a36Sopenharmony_ci pthr->tidx, ktime_to_us(pthr->duration)); 98862306a36Sopenharmony_ci 98962306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "%d: %llu MBytes/s\n", pthr->tidx, 99062306a36Sopenharmony_ci div64_u64(pthr->copied, ktime_to_us(pthr->duration))); 99162306a36Sopenharmony_ci 99262306a36Sopenharmony_ci return 0; 99362306a36Sopenharmony_ci} 99462306a36Sopenharmony_ci 99562306a36Sopenharmony_cistatic void perf_clear_test(struct perf_thread *pthr) 99662306a36Sopenharmony_ci{ 99762306a36Sopenharmony_ci struct perf_ctx *perf = pthr->perf; 99862306a36Sopenharmony_ci 99962306a36Sopenharmony_ci if (!use_dma) 100062306a36Sopenharmony_ci goto no_dma_notify; 100162306a36Sopenharmony_ci 100262306a36Sopenharmony_ci /* 100362306a36Sopenharmony_ci * If test finished without errors, termination isn't needed. 100462306a36Sopenharmony_ci * We call it anyway just to be sure of the transfers completion. 100562306a36Sopenharmony_ci */ 100662306a36Sopenharmony_ci (void)dmaengine_terminate_sync(pthr->dma_chan); 100762306a36Sopenharmony_ci if (pthr->perf->test_peer->dma_dst_addr) 100862306a36Sopenharmony_ci dma_unmap_resource(pthr->dma_chan->device->dev, 100962306a36Sopenharmony_ci pthr->perf->test_peer->dma_dst_addr, 101062306a36Sopenharmony_ci pthr->perf->test_peer->outbuf_size, 101162306a36Sopenharmony_ci DMA_FROM_DEVICE, 0); 101262306a36Sopenharmony_ci 101362306a36Sopenharmony_ci dma_release_channel(pthr->dma_chan); 101462306a36Sopenharmony_ci 101562306a36Sopenharmony_cino_dma_notify: 101662306a36Sopenharmony_ci atomic_dec(&perf->tsync); 101762306a36Sopenharmony_ci wake_up(&perf->twait); 101862306a36Sopenharmony_ci kfree(pthr->src); 101962306a36Sopenharmony_ci} 102062306a36Sopenharmony_ci 102162306a36Sopenharmony_cistatic void perf_thread_work(struct work_struct *work) 102262306a36Sopenharmony_ci{ 102362306a36Sopenharmony_ci struct perf_thread *pthr = to_thread_work(work); 102462306a36Sopenharmony_ci int ret; 102562306a36Sopenharmony_ci 102662306a36Sopenharmony_ci /* 102762306a36Sopenharmony_ci * Perform stages in compliance with use_dma flag value. 102862306a36Sopenharmony_ci * Test status is changed only if error happened, otherwise 102962306a36Sopenharmony_ci * status -ENODATA is kept while test is on-fly. Results 103062306a36Sopenharmony_ci * synchronization is performed only if test fininshed 103162306a36Sopenharmony_ci * without an error or interruption. 103262306a36Sopenharmony_ci */ 103362306a36Sopenharmony_ci ret = perf_init_test(pthr); 103462306a36Sopenharmony_ci if (ret) { 103562306a36Sopenharmony_ci pthr->status = ret; 103662306a36Sopenharmony_ci return; 103762306a36Sopenharmony_ci } 103862306a36Sopenharmony_ci 103962306a36Sopenharmony_ci ret = perf_run_test(pthr); 104062306a36Sopenharmony_ci if (ret) { 104162306a36Sopenharmony_ci pthr->status = ret; 104262306a36Sopenharmony_ci goto err_clear_test; 104362306a36Sopenharmony_ci } 104462306a36Sopenharmony_ci 104562306a36Sopenharmony_ci pthr->status = perf_sync_test(pthr); 104662306a36Sopenharmony_ci 104762306a36Sopenharmony_cierr_clear_test: 104862306a36Sopenharmony_ci perf_clear_test(pthr); 104962306a36Sopenharmony_ci} 105062306a36Sopenharmony_ci 105162306a36Sopenharmony_cistatic int perf_set_tcnt(struct perf_ctx *perf, u8 tcnt) 105262306a36Sopenharmony_ci{ 105362306a36Sopenharmony_ci if (tcnt == 0 || tcnt > MAX_THREADS_CNT) 105462306a36Sopenharmony_ci return -EINVAL; 105562306a36Sopenharmony_ci 105662306a36Sopenharmony_ci if (test_and_set_bit_lock(0, &perf->busy_flag)) 105762306a36Sopenharmony_ci return -EBUSY; 105862306a36Sopenharmony_ci 105962306a36Sopenharmony_ci perf->tcnt = tcnt; 106062306a36Sopenharmony_ci 106162306a36Sopenharmony_ci clear_bit_unlock(0, &perf->busy_flag); 106262306a36Sopenharmony_ci 106362306a36Sopenharmony_ci return 0; 106462306a36Sopenharmony_ci} 106562306a36Sopenharmony_ci 106662306a36Sopenharmony_cistatic void perf_terminate_test(struct perf_ctx *perf) 106762306a36Sopenharmony_ci{ 106862306a36Sopenharmony_ci int tidx; 106962306a36Sopenharmony_ci 107062306a36Sopenharmony_ci atomic_set(&perf->tsync, -1); 107162306a36Sopenharmony_ci wake_up(&perf->twait); 107262306a36Sopenharmony_ci 107362306a36Sopenharmony_ci for (tidx = 0; tidx < MAX_THREADS_CNT; tidx++) { 107462306a36Sopenharmony_ci wake_up(&perf->threads[tidx].dma_wait); 107562306a36Sopenharmony_ci cancel_work_sync(&perf->threads[tidx].work); 107662306a36Sopenharmony_ci } 107762306a36Sopenharmony_ci} 107862306a36Sopenharmony_ci 107962306a36Sopenharmony_cistatic int perf_submit_test(struct perf_peer *peer) 108062306a36Sopenharmony_ci{ 108162306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 108262306a36Sopenharmony_ci struct perf_thread *pthr; 108362306a36Sopenharmony_ci int tidx, ret; 108462306a36Sopenharmony_ci 108562306a36Sopenharmony_ci ret = wait_for_completion_interruptible(&peer->init_comp); 108662306a36Sopenharmony_ci if (ret < 0) 108762306a36Sopenharmony_ci return ret; 108862306a36Sopenharmony_ci 108962306a36Sopenharmony_ci if (test_and_set_bit_lock(0, &perf->busy_flag)) 109062306a36Sopenharmony_ci return -EBUSY; 109162306a36Sopenharmony_ci 109262306a36Sopenharmony_ci perf->test_peer = peer; 109362306a36Sopenharmony_ci atomic_set(&perf->tsync, perf->tcnt); 109462306a36Sopenharmony_ci 109562306a36Sopenharmony_ci for (tidx = 0; tidx < MAX_THREADS_CNT; tidx++) { 109662306a36Sopenharmony_ci pthr = &perf->threads[tidx]; 109762306a36Sopenharmony_ci 109862306a36Sopenharmony_ci pthr->status = -ENODATA; 109962306a36Sopenharmony_ci pthr->copied = 0; 110062306a36Sopenharmony_ci pthr->duration = ktime_set(0, 0); 110162306a36Sopenharmony_ci if (tidx < perf->tcnt) 110262306a36Sopenharmony_ci (void)queue_work(perf_wq, &pthr->work); 110362306a36Sopenharmony_ci } 110462306a36Sopenharmony_ci 110562306a36Sopenharmony_ci ret = wait_event_interruptible(perf->twait, 110662306a36Sopenharmony_ci atomic_read(&perf->tsync) <= 0); 110762306a36Sopenharmony_ci if (ret == -ERESTARTSYS) { 110862306a36Sopenharmony_ci perf_terminate_test(perf); 110962306a36Sopenharmony_ci ret = -EINTR; 111062306a36Sopenharmony_ci } 111162306a36Sopenharmony_ci 111262306a36Sopenharmony_ci clear_bit_unlock(0, &perf->busy_flag); 111362306a36Sopenharmony_ci 111462306a36Sopenharmony_ci return ret; 111562306a36Sopenharmony_ci} 111662306a36Sopenharmony_ci 111762306a36Sopenharmony_cistatic int perf_read_stats(struct perf_ctx *perf, char *buf, 111862306a36Sopenharmony_ci size_t size, ssize_t *pos) 111962306a36Sopenharmony_ci{ 112062306a36Sopenharmony_ci struct perf_thread *pthr; 112162306a36Sopenharmony_ci int tidx; 112262306a36Sopenharmony_ci 112362306a36Sopenharmony_ci if (test_and_set_bit_lock(0, &perf->busy_flag)) 112462306a36Sopenharmony_ci return -EBUSY; 112562306a36Sopenharmony_ci 112662306a36Sopenharmony_ci (*pos) += scnprintf(buf + *pos, size - *pos, 112762306a36Sopenharmony_ci " Peer %d test statistics:\n", perf->test_peer->pidx); 112862306a36Sopenharmony_ci 112962306a36Sopenharmony_ci for (tidx = 0; tidx < MAX_THREADS_CNT; tidx++) { 113062306a36Sopenharmony_ci pthr = &perf->threads[tidx]; 113162306a36Sopenharmony_ci 113262306a36Sopenharmony_ci if (pthr->status == -ENODATA) 113362306a36Sopenharmony_ci continue; 113462306a36Sopenharmony_ci 113562306a36Sopenharmony_ci if (pthr->status) { 113662306a36Sopenharmony_ci (*pos) += scnprintf(buf + *pos, size - *pos, 113762306a36Sopenharmony_ci "%d: error status %d\n", tidx, pthr->status); 113862306a36Sopenharmony_ci continue; 113962306a36Sopenharmony_ci } 114062306a36Sopenharmony_ci 114162306a36Sopenharmony_ci (*pos) += scnprintf(buf + *pos, size - *pos, 114262306a36Sopenharmony_ci "%d: copied %llu bytes in %llu usecs, %llu MBytes/s\n", 114362306a36Sopenharmony_ci tidx, pthr->copied, ktime_to_us(pthr->duration), 114462306a36Sopenharmony_ci div64_u64(pthr->copied, ktime_to_us(pthr->duration))); 114562306a36Sopenharmony_ci } 114662306a36Sopenharmony_ci 114762306a36Sopenharmony_ci clear_bit_unlock(0, &perf->busy_flag); 114862306a36Sopenharmony_ci 114962306a36Sopenharmony_ci return 0; 115062306a36Sopenharmony_ci} 115162306a36Sopenharmony_ci 115262306a36Sopenharmony_cistatic void perf_init_threads(struct perf_ctx *perf) 115362306a36Sopenharmony_ci{ 115462306a36Sopenharmony_ci struct perf_thread *pthr; 115562306a36Sopenharmony_ci int tidx; 115662306a36Sopenharmony_ci 115762306a36Sopenharmony_ci perf->tcnt = DEF_THREADS_CNT; 115862306a36Sopenharmony_ci perf->test_peer = &perf->peers[0]; 115962306a36Sopenharmony_ci init_waitqueue_head(&perf->twait); 116062306a36Sopenharmony_ci 116162306a36Sopenharmony_ci for (tidx = 0; tidx < MAX_THREADS_CNT; tidx++) { 116262306a36Sopenharmony_ci pthr = &perf->threads[tidx]; 116362306a36Sopenharmony_ci 116462306a36Sopenharmony_ci pthr->perf = perf; 116562306a36Sopenharmony_ci pthr->tidx = tidx; 116662306a36Sopenharmony_ci pthr->status = -ENODATA; 116762306a36Sopenharmony_ci init_waitqueue_head(&pthr->dma_wait); 116862306a36Sopenharmony_ci INIT_WORK(&pthr->work, perf_thread_work); 116962306a36Sopenharmony_ci } 117062306a36Sopenharmony_ci} 117162306a36Sopenharmony_ci 117262306a36Sopenharmony_cistatic void perf_clear_threads(struct perf_ctx *perf) 117362306a36Sopenharmony_ci{ 117462306a36Sopenharmony_ci perf_terminate_test(perf); 117562306a36Sopenharmony_ci} 117662306a36Sopenharmony_ci 117762306a36Sopenharmony_ci/*============================================================================== 117862306a36Sopenharmony_ci * DebugFS nodes 117962306a36Sopenharmony_ci *============================================================================== 118062306a36Sopenharmony_ci */ 118162306a36Sopenharmony_ci 118262306a36Sopenharmony_cistatic ssize_t perf_dbgfs_read_info(struct file *filep, char __user *ubuf, 118362306a36Sopenharmony_ci size_t size, loff_t *offp) 118462306a36Sopenharmony_ci{ 118562306a36Sopenharmony_ci struct perf_ctx *perf = filep->private_data; 118662306a36Sopenharmony_ci struct perf_peer *peer; 118762306a36Sopenharmony_ci size_t buf_size; 118862306a36Sopenharmony_ci ssize_t pos = 0; 118962306a36Sopenharmony_ci int ret, pidx; 119062306a36Sopenharmony_ci char *buf; 119162306a36Sopenharmony_ci 119262306a36Sopenharmony_ci buf_size = min_t(size_t, size, 0x1000U); 119362306a36Sopenharmony_ci 119462306a36Sopenharmony_ci buf = kmalloc(buf_size, GFP_KERNEL); 119562306a36Sopenharmony_ci if (!buf) 119662306a36Sopenharmony_ci return -ENOMEM; 119762306a36Sopenharmony_ci 119862306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 119962306a36Sopenharmony_ci " Performance measuring tool info:\n\n"); 120062306a36Sopenharmony_ci 120162306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 120262306a36Sopenharmony_ci "Local port %d, Global index %d\n", ntb_port_number(perf->ntb), 120362306a36Sopenharmony_ci perf->gidx); 120462306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, "Test status: "); 120562306a36Sopenharmony_ci if (test_bit(0, &perf->busy_flag)) { 120662306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 120762306a36Sopenharmony_ci "on-fly with port %d (%d)\n", 120862306a36Sopenharmony_ci ntb_peer_port_number(perf->ntb, perf->test_peer->pidx), 120962306a36Sopenharmony_ci perf->test_peer->pidx); 121062306a36Sopenharmony_ci } else { 121162306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, "idle\n"); 121262306a36Sopenharmony_ci } 121362306a36Sopenharmony_ci 121462306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) { 121562306a36Sopenharmony_ci peer = &perf->peers[pidx]; 121662306a36Sopenharmony_ci 121762306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 121862306a36Sopenharmony_ci "Port %d (%d), Global index %d:\n", 121962306a36Sopenharmony_ci ntb_peer_port_number(perf->ntb, peer->pidx), peer->pidx, 122062306a36Sopenharmony_ci peer->gidx); 122162306a36Sopenharmony_ci 122262306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 122362306a36Sopenharmony_ci "\tLink status: %s\n", 122462306a36Sopenharmony_ci test_bit(PERF_STS_LNKUP, &peer->sts) ? "up" : "down"); 122562306a36Sopenharmony_ci 122662306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 122762306a36Sopenharmony_ci "\tOut buffer addr 0x%pK\n", peer->outbuf); 122862306a36Sopenharmony_ci 122962306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 123062306a36Sopenharmony_ci "\tOut buff phys addr %pa[p]\n", &peer->out_phys_addr); 123162306a36Sopenharmony_ci 123262306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 123362306a36Sopenharmony_ci "\tOut buffer size %pa\n", &peer->outbuf_size); 123462306a36Sopenharmony_ci 123562306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 123662306a36Sopenharmony_ci "\tOut buffer xlat 0x%016llx[p]\n", peer->outbuf_xlat); 123762306a36Sopenharmony_ci 123862306a36Sopenharmony_ci if (!peer->inbuf) { 123962306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 124062306a36Sopenharmony_ci "\tIn buffer addr: unallocated\n"); 124162306a36Sopenharmony_ci continue; 124262306a36Sopenharmony_ci } 124362306a36Sopenharmony_ci 124462306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 124562306a36Sopenharmony_ci "\tIn buffer addr 0x%pK\n", peer->inbuf); 124662306a36Sopenharmony_ci 124762306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 124862306a36Sopenharmony_ci "\tIn buffer size %pa\n", &peer->inbuf_size); 124962306a36Sopenharmony_ci 125062306a36Sopenharmony_ci pos += scnprintf(buf + pos, buf_size - pos, 125162306a36Sopenharmony_ci "\tIn buffer xlat %pad[p]\n", &peer->inbuf_xlat); 125262306a36Sopenharmony_ci } 125362306a36Sopenharmony_ci 125462306a36Sopenharmony_ci ret = simple_read_from_buffer(ubuf, size, offp, buf, pos); 125562306a36Sopenharmony_ci kfree(buf); 125662306a36Sopenharmony_ci 125762306a36Sopenharmony_ci return ret; 125862306a36Sopenharmony_ci} 125962306a36Sopenharmony_ci 126062306a36Sopenharmony_cistatic const struct file_operations perf_dbgfs_info = { 126162306a36Sopenharmony_ci .open = simple_open, 126262306a36Sopenharmony_ci .read = perf_dbgfs_read_info 126362306a36Sopenharmony_ci}; 126462306a36Sopenharmony_ci 126562306a36Sopenharmony_cistatic ssize_t perf_dbgfs_read_run(struct file *filep, char __user *ubuf, 126662306a36Sopenharmony_ci size_t size, loff_t *offp) 126762306a36Sopenharmony_ci{ 126862306a36Sopenharmony_ci struct perf_ctx *perf = filep->private_data; 126962306a36Sopenharmony_ci ssize_t ret, pos = 0; 127062306a36Sopenharmony_ci char *buf; 127162306a36Sopenharmony_ci 127262306a36Sopenharmony_ci buf = kmalloc(PERF_BUF_LEN, GFP_KERNEL); 127362306a36Sopenharmony_ci if (!buf) 127462306a36Sopenharmony_ci return -ENOMEM; 127562306a36Sopenharmony_ci 127662306a36Sopenharmony_ci ret = perf_read_stats(perf, buf, PERF_BUF_LEN, &pos); 127762306a36Sopenharmony_ci if (ret) 127862306a36Sopenharmony_ci goto err_free; 127962306a36Sopenharmony_ci 128062306a36Sopenharmony_ci ret = simple_read_from_buffer(ubuf, size, offp, buf, pos); 128162306a36Sopenharmony_cierr_free: 128262306a36Sopenharmony_ci kfree(buf); 128362306a36Sopenharmony_ci 128462306a36Sopenharmony_ci return ret; 128562306a36Sopenharmony_ci} 128662306a36Sopenharmony_ci 128762306a36Sopenharmony_cistatic ssize_t perf_dbgfs_write_run(struct file *filep, const char __user *ubuf, 128862306a36Sopenharmony_ci size_t size, loff_t *offp) 128962306a36Sopenharmony_ci{ 129062306a36Sopenharmony_ci struct perf_ctx *perf = filep->private_data; 129162306a36Sopenharmony_ci struct perf_peer *peer; 129262306a36Sopenharmony_ci int pidx, ret; 129362306a36Sopenharmony_ci 129462306a36Sopenharmony_ci ret = kstrtoint_from_user(ubuf, size, 0, &pidx); 129562306a36Sopenharmony_ci if (ret) 129662306a36Sopenharmony_ci return ret; 129762306a36Sopenharmony_ci 129862306a36Sopenharmony_ci if (pidx < 0 || pidx >= perf->pcnt) 129962306a36Sopenharmony_ci return -EINVAL; 130062306a36Sopenharmony_ci 130162306a36Sopenharmony_ci peer = &perf->peers[pidx]; 130262306a36Sopenharmony_ci 130362306a36Sopenharmony_ci ret = perf_submit_test(peer); 130462306a36Sopenharmony_ci if (ret) 130562306a36Sopenharmony_ci return ret; 130662306a36Sopenharmony_ci 130762306a36Sopenharmony_ci return size; 130862306a36Sopenharmony_ci} 130962306a36Sopenharmony_ci 131062306a36Sopenharmony_cistatic const struct file_operations perf_dbgfs_run = { 131162306a36Sopenharmony_ci .open = simple_open, 131262306a36Sopenharmony_ci .read = perf_dbgfs_read_run, 131362306a36Sopenharmony_ci .write = perf_dbgfs_write_run 131462306a36Sopenharmony_ci}; 131562306a36Sopenharmony_ci 131662306a36Sopenharmony_cistatic ssize_t perf_dbgfs_read_tcnt(struct file *filep, char __user *ubuf, 131762306a36Sopenharmony_ci size_t size, loff_t *offp) 131862306a36Sopenharmony_ci{ 131962306a36Sopenharmony_ci struct perf_ctx *perf = filep->private_data; 132062306a36Sopenharmony_ci char buf[8]; 132162306a36Sopenharmony_ci ssize_t pos; 132262306a36Sopenharmony_ci 132362306a36Sopenharmony_ci pos = scnprintf(buf, sizeof(buf), "%hhu\n", perf->tcnt); 132462306a36Sopenharmony_ci 132562306a36Sopenharmony_ci return simple_read_from_buffer(ubuf, size, offp, buf, pos); 132662306a36Sopenharmony_ci} 132762306a36Sopenharmony_ci 132862306a36Sopenharmony_cistatic ssize_t perf_dbgfs_write_tcnt(struct file *filep, 132962306a36Sopenharmony_ci const char __user *ubuf, 133062306a36Sopenharmony_ci size_t size, loff_t *offp) 133162306a36Sopenharmony_ci{ 133262306a36Sopenharmony_ci struct perf_ctx *perf = filep->private_data; 133362306a36Sopenharmony_ci int ret; 133462306a36Sopenharmony_ci u8 val; 133562306a36Sopenharmony_ci 133662306a36Sopenharmony_ci ret = kstrtou8_from_user(ubuf, size, 0, &val); 133762306a36Sopenharmony_ci if (ret) 133862306a36Sopenharmony_ci return ret; 133962306a36Sopenharmony_ci 134062306a36Sopenharmony_ci ret = perf_set_tcnt(perf, val); 134162306a36Sopenharmony_ci if (ret) 134262306a36Sopenharmony_ci return ret; 134362306a36Sopenharmony_ci 134462306a36Sopenharmony_ci return size; 134562306a36Sopenharmony_ci} 134662306a36Sopenharmony_ci 134762306a36Sopenharmony_cistatic const struct file_operations perf_dbgfs_tcnt = { 134862306a36Sopenharmony_ci .open = simple_open, 134962306a36Sopenharmony_ci .read = perf_dbgfs_read_tcnt, 135062306a36Sopenharmony_ci .write = perf_dbgfs_write_tcnt 135162306a36Sopenharmony_ci}; 135262306a36Sopenharmony_ci 135362306a36Sopenharmony_cistatic void perf_setup_dbgfs(struct perf_ctx *perf) 135462306a36Sopenharmony_ci{ 135562306a36Sopenharmony_ci struct pci_dev *pdev = perf->ntb->pdev; 135662306a36Sopenharmony_ci 135762306a36Sopenharmony_ci perf->dbgfs_dir = debugfs_create_dir(pci_name(pdev), perf_dbgfs_topdir); 135862306a36Sopenharmony_ci if (IS_ERR(perf->dbgfs_dir)) { 135962306a36Sopenharmony_ci dev_warn(&perf->ntb->dev, "DebugFS unsupported\n"); 136062306a36Sopenharmony_ci return; 136162306a36Sopenharmony_ci } 136262306a36Sopenharmony_ci 136362306a36Sopenharmony_ci debugfs_create_file("info", 0600, perf->dbgfs_dir, perf, 136462306a36Sopenharmony_ci &perf_dbgfs_info); 136562306a36Sopenharmony_ci 136662306a36Sopenharmony_ci debugfs_create_file("run", 0600, perf->dbgfs_dir, perf, 136762306a36Sopenharmony_ci &perf_dbgfs_run); 136862306a36Sopenharmony_ci 136962306a36Sopenharmony_ci debugfs_create_file("threads_count", 0600, perf->dbgfs_dir, perf, 137062306a36Sopenharmony_ci &perf_dbgfs_tcnt); 137162306a36Sopenharmony_ci 137262306a36Sopenharmony_ci /* They are made read-only for test exec safety and integrity */ 137362306a36Sopenharmony_ci debugfs_create_u8("chunk_order", 0500, perf->dbgfs_dir, &chunk_order); 137462306a36Sopenharmony_ci 137562306a36Sopenharmony_ci debugfs_create_u8("total_order", 0500, perf->dbgfs_dir, &total_order); 137662306a36Sopenharmony_ci 137762306a36Sopenharmony_ci debugfs_create_bool("use_dma", 0500, perf->dbgfs_dir, &use_dma); 137862306a36Sopenharmony_ci} 137962306a36Sopenharmony_ci 138062306a36Sopenharmony_cistatic void perf_clear_dbgfs(struct perf_ctx *perf) 138162306a36Sopenharmony_ci{ 138262306a36Sopenharmony_ci debugfs_remove_recursive(perf->dbgfs_dir); 138362306a36Sopenharmony_ci} 138462306a36Sopenharmony_ci 138562306a36Sopenharmony_ci/*============================================================================== 138662306a36Sopenharmony_ci * Basic driver initialization 138762306a36Sopenharmony_ci *============================================================================== 138862306a36Sopenharmony_ci */ 138962306a36Sopenharmony_ci 139062306a36Sopenharmony_cistatic struct perf_ctx *perf_create_data(struct ntb_dev *ntb) 139162306a36Sopenharmony_ci{ 139262306a36Sopenharmony_ci struct perf_ctx *perf; 139362306a36Sopenharmony_ci 139462306a36Sopenharmony_ci perf = devm_kzalloc(&ntb->dev, sizeof(*perf), GFP_KERNEL); 139562306a36Sopenharmony_ci if (!perf) 139662306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 139762306a36Sopenharmony_ci 139862306a36Sopenharmony_ci perf->pcnt = ntb_peer_port_count(ntb); 139962306a36Sopenharmony_ci perf->peers = devm_kcalloc(&ntb->dev, perf->pcnt, sizeof(*perf->peers), 140062306a36Sopenharmony_ci GFP_KERNEL); 140162306a36Sopenharmony_ci if (!perf->peers) 140262306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 140362306a36Sopenharmony_ci 140462306a36Sopenharmony_ci perf->ntb = ntb; 140562306a36Sopenharmony_ci 140662306a36Sopenharmony_ci return perf; 140762306a36Sopenharmony_ci} 140862306a36Sopenharmony_ci 140962306a36Sopenharmony_cistatic int perf_setup_peer_mw(struct perf_peer *peer) 141062306a36Sopenharmony_ci{ 141162306a36Sopenharmony_ci struct perf_ctx *perf = peer->perf; 141262306a36Sopenharmony_ci phys_addr_t phys_addr; 141362306a36Sopenharmony_ci int ret; 141462306a36Sopenharmony_ci 141562306a36Sopenharmony_ci /* Get outbound MW parameters and map it */ 141662306a36Sopenharmony_ci ret = ntb_peer_mw_get_addr(perf->ntb, perf->gidx, &phys_addr, 141762306a36Sopenharmony_ci &peer->outbuf_size); 141862306a36Sopenharmony_ci if (ret) 141962306a36Sopenharmony_ci return ret; 142062306a36Sopenharmony_ci 142162306a36Sopenharmony_ci peer->outbuf = devm_ioremap_wc(&perf->ntb->dev, phys_addr, 142262306a36Sopenharmony_ci peer->outbuf_size); 142362306a36Sopenharmony_ci if (!peer->outbuf) 142462306a36Sopenharmony_ci return -ENOMEM; 142562306a36Sopenharmony_ci 142662306a36Sopenharmony_ci peer->out_phys_addr = phys_addr; 142762306a36Sopenharmony_ci 142862306a36Sopenharmony_ci if (max_mw_size && peer->outbuf_size > max_mw_size) { 142962306a36Sopenharmony_ci peer->outbuf_size = max_mw_size; 143062306a36Sopenharmony_ci dev_warn(&peer->perf->ntb->dev, 143162306a36Sopenharmony_ci "Peer %d outbuf reduced to %pa\n", peer->pidx, 143262306a36Sopenharmony_ci &peer->outbuf_size); 143362306a36Sopenharmony_ci } 143462306a36Sopenharmony_ci 143562306a36Sopenharmony_ci return 0; 143662306a36Sopenharmony_ci} 143762306a36Sopenharmony_ci 143862306a36Sopenharmony_cistatic int perf_init_peers(struct perf_ctx *perf) 143962306a36Sopenharmony_ci{ 144062306a36Sopenharmony_ci struct perf_peer *peer; 144162306a36Sopenharmony_ci int pidx, lport, ret; 144262306a36Sopenharmony_ci 144362306a36Sopenharmony_ci lport = ntb_port_number(perf->ntb); 144462306a36Sopenharmony_ci perf->gidx = -1; 144562306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) { 144662306a36Sopenharmony_ci peer = &perf->peers[pidx]; 144762306a36Sopenharmony_ci 144862306a36Sopenharmony_ci peer->perf = perf; 144962306a36Sopenharmony_ci peer->pidx = pidx; 145062306a36Sopenharmony_ci if (lport < ntb_peer_port_number(perf->ntb, pidx)) { 145162306a36Sopenharmony_ci if (perf->gidx == -1) 145262306a36Sopenharmony_ci perf->gidx = pidx; 145362306a36Sopenharmony_ci peer->gidx = pidx + 1; 145462306a36Sopenharmony_ci } else { 145562306a36Sopenharmony_ci peer->gidx = pidx; 145662306a36Sopenharmony_ci } 145762306a36Sopenharmony_ci INIT_WORK(&peer->service, perf_service_work); 145862306a36Sopenharmony_ci init_completion(&peer->init_comp); 145962306a36Sopenharmony_ci } 146062306a36Sopenharmony_ci if (perf->gidx == -1) 146162306a36Sopenharmony_ci perf->gidx = pidx; 146262306a36Sopenharmony_ci 146362306a36Sopenharmony_ci /* 146462306a36Sopenharmony_ci * Hardware with only two ports may not have unique port 146562306a36Sopenharmony_ci * numbers. In this case, the gidxs should all be zero. 146662306a36Sopenharmony_ci */ 146762306a36Sopenharmony_ci if (perf->pcnt == 1 && ntb_port_number(perf->ntb) == 0 && 146862306a36Sopenharmony_ci ntb_peer_port_number(perf->ntb, 0) == 0) { 146962306a36Sopenharmony_ci perf->gidx = 0; 147062306a36Sopenharmony_ci perf->peers[0].gidx = 0; 147162306a36Sopenharmony_ci } 147262306a36Sopenharmony_ci 147362306a36Sopenharmony_ci for (pidx = 0; pidx < perf->pcnt; pidx++) { 147462306a36Sopenharmony_ci ret = perf_setup_peer_mw(&perf->peers[pidx]); 147562306a36Sopenharmony_ci if (ret) 147662306a36Sopenharmony_ci return ret; 147762306a36Sopenharmony_ci } 147862306a36Sopenharmony_ci 147962306a36Sopenharmony_ci dev_dbg(&perf->ntb->dev, "Global port index %d\n", perf->gidx); 148062306a36Sopenharmony_ci 148162306a36Sopenharmony_ci return 0; 148262306a36Sopenharmony_ci} 148362306a36Sopenharmony_ci 148462306a36Sopenharmony_cistatic int perf_probe(struct ntb_client *client, struct ntb_dev *ntb) 148562306a36Sopenharmony_ci{ 148662306a36Sopenharmony_ci struct perf_ctx *perf; 148762306a36Sopenharmony_ci int ret; 148862306a36Sopenharmony_ci 148962306a36Sopenharmony_ci perf = perf_create_data(ntb); 149062306a36Sopenharmony_ci if (IS_ERR(perf)) 149162306a36Sopenharmony_ci return PTR_ERR(perf); 149262306a36Sopenharmony_ci 149362306a36Sopenharmony_ci ret = perf_init_peers(perf); 149462306a36Sopenharmony_ci if (ret) 149562306a36Sopenharmony_ci return ret; 149662306a36Sopenharmony_ci 149762306a36Sopenharmony_ci perf_init_threads(perf); 149862306a36Sopenharmony_ci 149962306a36Sopenharmony_ci ret = perf_init_service(perf); 150062306a36Sopenharmony_ci if (ret) 150162306a36Sopenharmony_ci return ret; 150262306a36Sopenharmony_ci 150362306a36Sopenharmony_ci ret = perf_enable_service(perf); 150462306a36Sopenharmony_ci if (ret) 150562306a36Sopenharmony_ci return ret; 150662306a36Sopenharmony_ci 150762306a36Sopenharmony_ci perf_setup_dbgfs(perf); 150862306a36Sopenharmony_ci 150962306a36Sopenharmony_ci return 0; 151062306a36Sopenharmony_ci} 151162306a36Sopenharmony_ci 151262306a36Sopenharmony_cistatic void perf_remove(struct ntb_client *client, struct ntb_dev *ntb) 151362306a36Sopenharmony_ci{ 151462306a36Sopenharmony_ci struct perf_ctx *perf = ntb->ctx; 151562306a36Sopenharmony_ci 151662306a36Sopenharmony_ci perf_clear_dbgfs(perf); 151762306a36Sopenharmony_ci 151862306a36Sopenharmony_ci perf_disable_service(perf); 151962306a36Sopenharmony_ci 152062306a36Sopenharmony_ci perf_clear_threads(perf); 152162306a36Sopenharmony_ci} 152262306a36Sopenharmony_ci 152362306a36Sopenharmony_cistatic struct ntb_client perf_client = { 152462306a36Sopenharmony_ci .ops = { 152562306a36Sopenharmony_ci .probe = perf_probe, 152662306a36Sopenharmony_ci .remove = perf_remove 152762306a36Sopenharmony_ci } 152862306a36Sopenharmony_ci}; 152962306a36Sopenharmony_ci 153062306a36Sopenharmony_cistatic int __init perf_init(void) 153162306a36Sopenharmony_ci{ 153262306a36Sopenharmony_ci int ret; 153362306a36Sopenharmony_ci 153462306a36Sopenharmony_ci if (chunk_order > MAX_CHUNK_ORDER) { 153562306a36Sopenharmony_ci chunk_order = MAX_CHUNK_ORDER; 153662306a36Sopenharmony_ci pr_info("Chunk order reduced to %hhu\n", chunk_order); 153762306a36Sopenharmony_ci } 153862306a36Sopenharmony_ci 153962306a36Sopenharmony_ci if (total_order < chunk_order) { 154062306a36Sopenharmony_ci total_order = chunk_order; 154162306a36Sopenharmony_ci pr_info("Total data order reduced to %hhu\n", total_order); 154262306a36Sopenharmony_ci } 154362306a36Sopenharmony_ci 154462306a36Sopenharmony_ci perf_wq = alloc_workqueue("perf_wq", WQ_UNBOUND | WQ_SYSFS, 0); 154562306a36Sopenharmony_ci if (!perf_wq) 154662306a36Sopenharmony_ci return -ENOMEM; 154762306a36Sopenharmony_ci 154862306a36Sopenharmony_ci if (debugfs_initialized()) 154962306a36Sopenharmony_ci perf_dbgfs_topdir = debugfs_create_dir(KBUILD_MODNAME, NULL); 155062306a36Sopenharmony_ci 155162306a36Sopenharmony_ci ret = ntb_register_client(&perf_client); 155262306a36Sopenharmony_ci if (ret) { 155362306a36Sopenharmony_ci debugfs_remove_recursive(perf_dbgfs_topdir); 155462306a36Sopenharmony_ci destroy_workqueue(perf_wq); 155562306a36Sopenharmony_ci } 155662306a36Sopenharmony_ci 155762306a36Sopenharmony_ci return ret; 155862306a36Sopenharmony_ci} 155962306a36Sopenharmony_cimodule_init(perf_init); 156062306a36Sopenharmony_ci 156162306a36Sopenharmony_cistatic void __exit perf_exit(void) 156262306a36Sopenharmony_ci{ 156362306a36Sopenharmony_ci ntb_unregister_client(&perf_client); 156462306a36Sopenharmony_ci debugfs_remove_recursive(perf_dbgfs_topdir); 156562306a36Sopenharmony_ci destroy_workqueue(perf_wq); 156662306a36Sopenharmony_ci} 156762306a36Sopenharmony_cimodule_exit(perf_exit); 1568