162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Copyright(c) 2018 Intel Corporation. 462306a36Sopenharmony_ci */ 562306a36Sopenharmony_ci 662306a36Sopenharmony_ci#include <linux/debugfs.h> 762306a36Sopenharmony_ci#include <linux/seq_file.h> 862306a36Sopenharmony_ci#include <linux/kernel.h> 962306a36Sopenharmony_ci#include <linux/types.h> 1062306a36Sopenharmony_ci#include <linux/bitmap.h> 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include "debugfs.h" 1362306a36Sopenharmony_ci#include "fault.h" 1462306a36Sopenharmony_ci#include "trace.h" 1562306a36Sopenharmony_ci 1662306a36Sopenharmony_ci#define HFI1_FAULT_DIR_TX BIT(0) 1762306a36Sopenharmony_ci#define HFI1_FAULT_DIR_RX BIT(1) 1862306a36Sopenharmony_ci#define HFI1_FAULT_DIR_TXRX (HFI1_FAULT_DIR_TX | HFI1_FAULT_DIR_RX) 1962306a36Sopenharmony_ci 2062306a36Sopenharmony_cistatic void *_fault_stats_seq_start(struct seq_file *s, loff_t *pos) 2162306a36Sopenharmony_ci{ 2262306a36Sopenharmony_ci struct hfi1_opcode_stats_perctx *opstats; 2362306a36Sopenharmony_ci 2462306a36Sopenharmony_ci if (*pos >= ARRAY_SIZE(opstats->stats)) 2562306a36Sopenharmony_ci return NULL; 2662306a36Sopenharmony_ci return pos; 2762306a36Sopenharmony_ci} 2862306a36Sopenharmony_ci 2962306a36Sopenharmony_cistatic void *_fault_stats_seq_next(struct seq_file *s, void *v, loff_t *pos) 3062306a36Sopenharmony_ci{ 3162306a36Sopenharmony_ci struct hfi1_opcode_stats_perctx *opstats; 3262306a36Sopenharmony_ci 3362306a36Sopenharmony_ci ++*pos; 3462306a36Sopenharmony_ci if (*pos >= ARRAY_SIZE(opstats->stats)) 3562306a36Sopenharmony_ci return NULL; 3662306a36Sopenharmony_ci return pos; 3762306a36Sopenharmony_ci} 3862306a36Sopenharmony_ci 3962306a36Sopenharmony_cistatic void _fault_stats_seq_stop(struct seq_file *s, void *v) 4062306a36Sopenharmony_ci{ 4162306a36Sopenharmony_ci} 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_cistatic int _fault_stats_seq_show(struct seq_file *s, void *v) 4462306a36Sopenharmony_ci{ 4562306a36Sopenharmony_ci loff_t *spos = v; 4662306a36Sopenharmony_ci loff_t i = *spos, j; 4762306a36Sopenharmony_ci u64 n_packets = 0, n_bytes = 0; 4862306a36Sopenharmony_ci struct hfi1_ibdev *ibd = (struct hfi1_ibdev *)s->private; 4962306a36Sopenharmony_ci struct hfi1_devdata *dd = dd_from_dev(ibd); 5062306a36Sopenharmony_ci struct hfi1_ctxtdata *rcd; 5162306a36Sopenharmony_ci 5262306a36Sopenharmony_ci for (j = 0; j < dd->first_dyn_alloc_ctxt; j++) { 5362306a36Sopenharmony_ci rcd = hfi1_rcd_get_by_index(dd, j); 5462306a36Sopenharmony_ci if (rcd) { 5562306a36Sopenharmony_ci n_packets += rcd->opstats->stats[i].n_packets; 5662306a36Sopenharmony_ci n_bytes += rcd->opstats->stats[i].n_bytes; 5762306a36Sopenharmony_ci } 5862306a36Sopenharmony_ci hfi1_rcd_put(rcd); 5962306a36Sopenharmony_ci } 6062306a36Sopenharmony_ci for_each_possible_cpu(j) { 6162306a36Sopenharmony_ci struct hfi1_opcode_stats_perctx *sp = 6262306a36Sopenharmony_ci per_cpu_ptr(dd->tx_opstats, j); 6362306a36Sopenharmony_ci 6462306a36Sopenharmony_ci n_packets += sp->stats[i].n_packets; 6562306a36Sopenharmony_ci n_bytes += sp->stats[i].n_bytes; 6662306a36Sopenharmony_ci } 6762306a36Sopenharmony_ci if (!n_packets && !n_bytes) 6862306a36Sopenharmony_ci return SEQ_SKIP; 6962306a36Sopenharmony_ci if (!ibd->fault->n_rxfaults[i] && !ibd->fault->n_txfaults[i]) 7062306a36Sopenharmony_ci return SEQ_SKIP; 7162306a36Sopenharmony_ci seq_printf(s, "%02llx %llu/%llu (faults rx:%llu faults: tx:%llu)\n", i, 7262306a36Sopenharmony_ci (unsigned long long)n_packets, 7362306a36Sopenharmony_ci (unsigned long long)n_bytes, 7462306a36Sopenharmony_ci (unsigned long long)ibd->fault->n_rxfaults[i], 7562306a36Sopenharmony_ci (unsigned long long)ibd->fault->n_txfaults[i]); 7662306a36Sopenharmony_ci return 0; 7762306a36Sopenharmony_ci} 7862306a36Sopenharmony_ci 7962306a36Sopenharmony_ciDEBUGFS_SEQ_FILE_OPS(fault_stats); 8062306a36Sopenharmony_ciDEBUGFS_SEQ_FILE_OPEN(fault_stats); 8162306a36Sopenharmony_ciDEBUGFS_FILE_OPS(fault_stats); 8262306a36Sopenharmony_ci 8362306a36Sopenharmony_cistatic int fault_opcodes_open(struct inode *inode, struct file *file) 8462306a36Sopenharmony_ci{ 8562306a36Sopenharmony_ci file->private_data = inode->i_private; 8662306a36Sopenharmony_ci return nonseekable_open(inode, file); 8762306a36Sopenharmony_ci} 8862306a36Sopenharmony_ci 8962306a36Sopenharmony_cistatic ssize_t fault_opcodes_write(struct file *file, const char __user *buf, 9062306a36Sopenharmony_ci size_t len, loff_t *pos) 9162306a36Sopenharmony_ci{ 9262306a36Sopenharmony_ci ssize_t ret = 0; 9362306a36Sopenharmony_ci /* 1280 = 256 opcodes * 4 chars/opcode + 255 commas + NULL */ 9462306a36Sopenharmony_ci size_t copy, datalen = 1280; 9562306a36Sopenharmony_ci char *data, *token, *ptr, *end; 9662306a36Sopenharmony_ci struct fault *fault = file->private_data; 9762306a36Sopenharmony_ci 9862306a36Sopenharmony_ci data = kcalloc(datalen, sizeof(*data), GFP_KERNEL); 9962306a36Sopenharmony_ci if (!data) 10062306a36Sopenharmony_ci return -ENOMEM; 10162306a36Sopenharmony_ci copy = min(len, datalen - 1); 10262306a36Sopenharmony_ci if (copy_from_user(data, buf, copy)) { 10362306a36Sopenharmony_ci ret = -EFAULT; 10462306a36Sopenharmony_ci goto free_data; 10562306a36Sopenharmony_ci } 10662306a36Sopenharmony_ci 10762306a36Sopenharmony_ci ret = debugfs_file_get(file->f_path.dentry); 10862306a36Sopenharmony_ci if (unlikely(ret)) 10962306a36Sopenharmony_ci goto free_data; 11062306a36Sopenharmony_ci ptr = data; 11162306a36Sopenharmony_ci token = ptr; 11262306a36Sopenharmony_ci for (ptr = data; *ptr; ptr = end + 1, token = ptr) { 11362306a36Sopenharmony_ci char *dash; 11462306a36Sopenharmony_ci unsigned long range_start, range_end, i; 11562306a36Sopenharmony_ci bool remove = false; 11662306a36Sopenharmony_ci unsigned long bound = 1U << BITS_PER_BYTE; 11762306a36Sopenharmony_ci 11862306a36Sopenharmony_ci end = strchr(ptr, ','); 11962306a36Sopenharmony_ci if (end) 12062306a36Sopenharmony_ci *end = '\0'; 12162306a36Sopenharmony_ci if (token[0] == '-') { 12262306a36Sopenharmony_ci remove = true; 12362306a36Sopenharmony_ci token++; 12462306a36Sopenharmony_ci } 12562306a36Sopenharmony_ci dash = strchr(token, '-'); 12662306a36Sopenharmony_ci if (dash) 12762306a36Sopenharmony_ci *dash = '\0'; 12862306a36Sopenharmony_ci if (kstrtoul(token, 0, &range_start)) 12962306a36Sopenharmony_ci break; 13062306a36Sopenharmony_ci if (dash) { 13162306a36Sopenharmony_ci token = dash + 1; 13262306a36Sopenharmony_ci if (kstrtoul(token, 0, &range_end)) 13362306a36Sopenharmony_ci break; 13462306a36Sopenharmony_ci } else { 13562306a36Sopenharmony_ci range_end = range_start; 13662306a36Sopenharmony_ci } 13762306a36Sopenharmony_ci if (range_start == range_end && range_start == -1UL) { 13862306a36Sopenharmony_ci bitmap_zero(fault->opcodes, sizeof(fault->opcodes) * 13962306a36Sopenharmony_ci BITS_PER_BYTE); 14062306a36Sopenharmony_ci break; 14162306a36Sopenharmony_ci } 14262306a36Sopenharmony_ci /* Check the inputs */ 14362306a36Sopenharmony_ci if (range_start >= bound || range_end >= bound) 14462306a36Sopenharmony_ci break; 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci for (i = range_start; i <= range_end; i++) { 14762306a36Sopenharmony_ci if (remove) 14862306a36Sopenharmony_ci clear_bit(i, fault->opcodes); 14962306a36Sopenharmony_ci else 15062306a36Sopenharmony_ci set_bit(i, fault->opcodes); 15162306a36Sopenharmony_ci } 15262306a36Sopenharmony_ci if (!end) 15362306a36Sopenharmony_ci break; 15462306a36Sopenharmony_ci } 15562306a36Sopenharmony_ci ret = len; 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci debugfs_file_put(file->f_path.dentry); 15862306a36Sopenharmony_cifree_data: 15962306a36Sopenharmony_ci kfree(data); 16062306a36Sopenharmony_ci return ret; 16162306a36Sopenharmony_ci} 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_cistatic ssize_t fault_opcodes_read(struct file *file, char __user *buf, 16462306a36Sopenharmony_ci size_t len, loff_t *pos) 16562306a36Sopenharmony_ci{ 16662306a36Sopenharmony_ci ssize_t ret = 0; 16762306a36Sopenharmony_ci char *data; 16862306a36Sopenharmony_ci size_t datalen = 1280, size = 0; /* see fault_opcodes_write() */ 16962306a36Sopenharmony_ci unsigned long bit = 0, zero = 0; 17062306a36Sopenharmony_ci struct fault *fault = file->private_data; 17162306a36Sopenharmony_ci size_t bitsize = sizeof(fault->opcodes) * BITS_PER_BYTE; 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_ci data = kcalloc(datalen, sizeof(*data), GFP_KERNEL); 17462306a36Sopenharmony_ci if (!data) 17562306a36Sopenharmony_ci return -ENOMEM; 17662306a36Sopenharmony_ci ret = debugfs_file_get(file->f_path.dentry); 17762306a36Sopenharmony_ci if (unlikely(ret)) 17862306a36Sopenharmony_ci goto free_data; 17962306a36Sopenharmony_ci bit = find_first_bit(fault->opcodes, bitsize); 18062306a36Sopenharmony_ci while (bit < bitsize) { 18162306a36Sopenharmony_ci zero = find_next_zero_bit(fault->opcodes, bitsize, bit); 18262306a36Sopenharmony_ci if (zero - 1 != bit) 18362306a36Sopenharmony_ci size += scnprintf(data + size, 18462306a36Sopenharmony_ci datalen - size - 1, 18562306a36Sopenharmony_ci "0x%lx-0x%lx,", bit, zero - 1); 18662306a36Sopenharmony_ci else 18762306a36Sopenharmony_ci size += scnprintf(data + size, 18862306a36Sopenharmony_ci datalen - size - 1, "0x%lx,", 18962306a36Sopenharmony_ci bit); 19062306a36Sopenharmony_ci bit = find_next_bit(fault->opcodes, bitsize, zero); 19162306a36Sopenharmony_ci } 19262306a36Sopenharmony_ci debugfs_file_put(file->f_path.dentry); 19362306a36Sopenharmony_ci data[size - 1] = '\n'; 19462306a36Sopenharmony_ci data[size] = '\0'; 19562306a36Sopenharmony_ci ret = simple_read_from_buffer(buf, len, pos, data, size); 19662306a36Sopenharmony_cifree_data: 19762306a36Sopenharmony_ci kfree(data); 19862306a36Sopenharmony_ci return ret; 19962306a36Sopenharmony_ci} 20062306a36Sopenharmony_ci 20162306a36Sopenharmony_cistatic const struct file_operations __fault_opcodes_fops = { 20262306a36Sopenharmony_ci .owner = THIS_MODULE, 20362306a36Sopenharmony_ci .open = fault_opcodes_open, 20462306a36Sopenharmony_ci .read = fault_opcodes_read, 20562306a36Sopenharmony_ci .write = fault_opcodes_write, 20662306a36Sopenharmony_ci .llseek = no_llseek 20762306a36Sopenharmony_ci}; 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_civoid hfi1_fault_exit_debugfs(struct hfi1_ibdev *ibd) 21062306a36Sopenharmony_ci{ 21162306a36Sopenharmony_ci if (ibd->fault) 21262306a36Sopenharmony_ci debugfs_remove_recursive(ibd->fault->dir); 21362306a36Sopenharmony_ci kfree(ibd->fault); 21462306a36Sopenharmony_ci ibd->fault = NULL; 21562306a36Sopenharmony_ci} 21662306a36Sopenharmony_ci 21762306a36Sopenharmony_ciint hfi1_fault_init_debugfs(struct hfi1_ibdev *ibd) 21862306a36Sopenharmony_ci{ 21962306a36Sopenharmony_ci struct dentry *parent = ibd->hfi1_ibdev_dbg; 22062306a36Sopenharmony_ci struct dentry *fault_dir; 22162306a36Sopenharmony_ci 22262306a36Sopenharmony_ci ibd->fault = kzalloc(sizeof(*ibd->fault), GFP_KERNEL); 22362306a36Sopenharmony_ci if (!ibd->fault) 22462306a36Sopenharmony_ci return -ENOMEM; 22562306a36Sopenharmony_ci 22662306a36Sopenharmony_ci ibd->fault->attr.interval = 1; 22762306a36Sopenharmony_ci ibd->fault->attr.require_end = ULONG_MAX; 22862306a36Sopenharmony_ci ibd->fault->attr.stacktrace_depth = 32; 22962306a36Sopenharmony_ci ibd->fault->attr.dname = NULL; 23062306a36Sopenharmony_ci ibd->fault->attr.verbose = 0; 23162306a36Sopenharmony_ci ibd->fault->enable = false; 23262306a36Sopenharmony_ci ibd->fault->opcode = false; 23362306a36Sopenharmony_ci ibd->fault->fault_skip = 0; 23462306a36Sopenharmony_ci ibd->fault->skip = 0; 23562306a36Sopenharmony_ci ibd->fault->direction = HFI1_FAULT_DIR_TXRX; 23662306a36Sopenharmony_ci ibd->fault->suppress_err = false; 23762306a36Sopenharmony_ci bitmap_zero(ibd->fault->opcodes, 23862306a36Sopenharmony_ci sizeof(ibd->fault->opcodes) * BITS_PER_BYTE); 23962306a36Sopenharmony_ci 24062306a36Sopenharmony_ci fault_dir = 24162306a36Sopenharmony_ci fault_create_debugfs_attr("fault", parent, &ibd->fault->attr); 24262306a36Sopenharmony_ci if (IS_ERR(fault_dir)) { 24362306a36Sopenharmony_ci kfree(ibd->fault); 24462306a36Sopenharmony_ci ibd->fault = NULL; 24562306a36Sopenharmony_ci return -ENOENT; 24662306a36Sopenharmony_ci } 24762306a36Sopenharmony_ci ibd->fault->dir = fault_dir; 24862306a36Sopenharmony_ci 24962306a36Sopenharmony_ci debugfs_create_file("fault_stats", 0444, fault_dir, ibd, 25062306a36Sopenharmony_ci &_fault_stats_file_ops); 25162306a36Sopenharmony_ci debugfs_create_bool("enable", 0600, fault_dir, &ibd->fault->enable); 25262306a36Sopenharmony_ci debugfs_create_bool("suppress_err", 0600, fault_dir, 25362306a36Sopenharmony_ci &ibd->fault->suppress_err); 25462306a36Sopenharmony_ci debugfs_create_bool("opcode_mode", 0600, fault_dir, 25562306a36Sopenharmony_ci &ibd->fault->opcode); 25662306a36Sopenharmony_ci debugfs_create_file("opcodes", 0600, fault_dir, ibd->fault, 25762306a36Sopenharmony_ci &__fault_opcodes_fops); 25862306a36Sopenharmony_ci debugfs_create_u64("skip_pkts", 0600, fault_dir, 25962306a36Sopenharmony_ci &ibd->fault->fault_skip); 26062306a36Sopenharmony_ci debugfs_create_u64("skip_usec", 0600, fault_dir, 26162306a36Sopenharmony_ci &ibd->fault->fault_skip_usec); 26262306a36Sopenharmony_ci debugfs_create_u8("direction", 0600, fault_dir, &ibd->fault->direction); 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci return 0; 26562306a36Sopenharmony_ci} 26662306a36Sopenharmony_ci 26762306a36Sopenharmony_cibool hfi1_dbg_fault_suppress_err(struct hfi1_ibdev *ibd) 26862306a36Sopenharmony_ci{ 26962306a36Sopenharmony_ci if (ibd->fault) 27062306a36Sopenharmony_ci return ibd->fault->suppress_err; 27162306a36Sopenharmony_ci return false; 27262306a36Sopenharmony_ci} 27362306a36Sopenharmony_ci 27462306a36Sopenharmony_cistatic bool __hfi1_should_fault(struct hfi1_ibdev *ibd, u32 opcode, 27562306a36Sopenharmony_ci u8 direction) 27662306a36Sopenharmony_ci{ 27762306a36Sopenharmony_ci bool ret = false; 27862306a36Sopenharmony_ci 27962306a36Sopenharmony_ci if (!ibd->fault || !ibd->fault->enable) 28062306a36Sopenharmony_ci return false; 28162306a36Sopenharmony_ci if (!(ibd->fault->direction & direction)) 28262306a36Sopenharmony_ci return false; 28362306a36Sopenharmony_ci if (ibd->fault->opcode) { 28462306a36Sopenharmony_ci if (bitmap_empty(ibd->fault->opcodes, 28562306a36Sopenharmony_ci (sizeof(ibd->fault->opcodes) * 28662306a36Sopenharmony_ci BITS_PER_BYTE))) 28762306a36Sopenharmony_ci return false; 28862306a36Sopenharmony_ci if (!(test_bit(opcode, ibd->fault->opcodes))) 28962306a36Sopenharmony_ci return false; 29062306a36Sopenharmony_ci } 29162306a36Sopenharmony_ci if (ibd->fault->fault_skip_usec && 29262306a36Sopenharmony_ci time_before(jiffies, ibd->fault->skip_usec)) 29362306a36Sopenharmony_ci return false; 29462306a36Sopenharmony_ci if (ibd->fault->fault_skip && ibd->fault->skip) { 29562306a36Sopenharmony_ci ibd->fault->skip--; 29662306a36Sopenharmony_ci return false; 29762306a36Sopenharmony_ci } 29862306a36Sopenharmony_ci ret = should_fail(&ibd->fault->attr, 1); 29962306a36Sopenharmony_ci if (ret) { 30062306a36Sopenharmony_ci ibd->fault->skip = ibd->fault->fault_skip; 30162306a36Sopenharmony_ci ibd->fault->skip_usec = jiffies + 30262306a36Sopenharmony_ci usecs_to_jiffies(ibd->fault->fault_skip_usec); 30362306a36Sopenharmony_ci } 30462306a36Sopenharmony_ci return ret; 30562306a36Sopenharmony_ci} 30662306a36Sopenharmony_ci 30762306a36Sopenharmony_cibool hfi1_dbg_should_fault_tx(struct rvt_qp *qp, u32 opcode) 30862306a36Sopenharmony_ci{ 30962306a36Sopenharmony_ci struct hfi1_ibdev *ibd = to_idev(qp->ibqp.device); 31062306a36Sopenharmony_ci 31162306a36Sopenharmony_ci if (__hfi1_should_fault(ibd, opcode, HFI1_FAULT_DIR_TX)) { 31262306a36Sopenharmony_ci trace_hfi1_fault_opcode(qp, opcode); 31362306a36Sopenharmony_ci ibd->fault->n_txfaults[opcode]++; 31462306a36Sopenharmony_ci return true; 31562306a36Sopenharmony_ci } 31662306a36Sopenharmony_ci return false; 31762306a36Sopenharmony_ci} 31862306a36Sopenharmony_ci 31962306a36Sopenharmony_cibool hfi1_dbg_should_fault_rx(struct hfi1_packet *packet) 32062306a36Sopenharmony_ci{ 32162306a36Sopenharmony_ci struct hfi1_ibdev *ibd = &packet->rcd->dd->verbs_dev; 32262306a36Sopenharmony_ci 32362306a36Sopenharmony_ci if (__hfi1_should_fault(ibd, packet->opcode, HFI1_FAULT_DIR_RX)) { 32462306a36Sopenharmony_ci trace_hfi1_fault_packet(packet); 32562306a36Sopenharmony_ci ibd->fault->n_rxfaults[packet->opcode]++; 32662306a36Sopenharmony_ci return true; 32762306a36Sopenharmony_ci } 32862306a36Sopenharmony_ci return false; 32962306a36Sopenharmony_ci} 330