1*145eba1aSCai Huoqing // SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause
2a74d5307SMitko Haralanov /*
3a74d5307SMitko Haralanov * Copyright(c) 2018 Intel Corporation.
4a74d5307SMitko Haralanov */
5*145eba1aSCai Huoqing
6a74d5307SMitko Haralanov #include <linux/debugfs.h>
7a74d5307SMitko Haralanov #include <linux/seq_file.h>
8a74d5307SMitko Haralanov #include <linux/kernel.h>
9a74d5307SMitko Haralanov #include <linux/types.h>
10a74d5307SMitko Haralanov #include <linux/bitmap.h>
11a74d5307SMitko Haralanov
12a74d5307SMitko Haralanov #include "debugfs.h"
13a74d5307SMitko Haralanov #include "fault.h"
14a74d5307SMitko Haralanov #include "trace.h"
15a74d5307SMitko Haralanov
/*
 * Direction bits for fault injection. They are tested against
 * fault->direction in __hfi1_should_fault().
 */
#define HFI1_FAULT_DIR_TX   BIT(0)	/* transmit path */
#define HFI1_FAULT_DIR_RX   BIT(1)	/* receive path */
/* Both directions; used as the initial value of fault->direction. */
#define HFI1_FAULT_DIR_TXRX (HFI1_FAULT_DIR_TX | HFI1_FAULT_DIR_RX)
19a74d5307SMitko Haralanov
/*
 * seq_file start callback for the fault_stats file.
 *
 * The iterator cookie is the position pointer itself; *pos is used as an
 * index into the per-opcode statistics array. Returns NULL once *pos is
 * past the end of that array, otherwise returns pos.
 */
static void *_fault_stats_seq_start(struct seq_file *s, loff_t *pos)
{
	/* Only used as a sizeof operand below; never dereferenced. */
	struct hfi1_opcode_stats_perctx *opstats;

	return *pos < ARRAY_SIZE(opstats->stats) ? pos : NULL;
}
28a74d5307SMitko Haralanov
/*
 * seq_file next callback for the fault_stats file.
 *
 * Advances *pos by one and returns pos while it still indexes a valid
 * entry of the per-opcode statistics array, or NULL when the end has been
 * reached.
 */
static void *_fault_stats_seq_next(struct seq_file *s, void *v, loff_t *pos)
{
	/* Only used as a sizeof operand below; never dereferenced. */
	struct hfi1_opcode_stats_perctx *opstats;

	*pos += 1;
	if (*pos < ARRAY_SIZE(opstats->stats))
		return pos;
	return NULL;
}
38a74d5307SMitko Haralanov
/*
 * seq_file stop callback for the fault_stats file.
 *
 * The start/next callbacks acquire nothing, so there is nothing to release.
 */
static void _fault_stats_seq_stop(struct seq_file *s, void *v)
{
	/* intentionally empty */
}
42a74d5307SMitko Haralanov
_fault_stats_seq_show(struct seq_file * s,void * v)43a74d5307SMitko Haralanov static int _fault_stats_seq_show(struct seq_file *s, void *v)
44a74d5307SMitko Haralanov {
45a74d5307SMitko Haralanov loff_t *spos = v;
46a74d5307SMitko Haralanov loff_t i = *spos, j;
47a74d5307SMitko Haralanov u64 n_packets = 0, n_bytes = 0;
48a74d5307SMitko Haralanov struct hfi1_ibdev *ibd = (struct hfi1_ibdev *)s->private;
49a74d5307SMitko Haralanov struct hfi1_devdata *dd = dd_from_dev(ibd);
50a74d5307SMitko Haralanov struct hfi1_ctxtdata *rcd;
51a74d5307SMitko Haralanov
52a74d5307SMitko Haralanov for (j = 0; j < dd->first_dyn_alloc_ctxt; j++) {
53a74d5307SMitko Haralanov rcd = hfi1_rcd_get_by_index(dd, j);
54a74d5307SMitko Haralanov if (rcd) {
55a74d5307SMitko Haralanov n_packets += rcd->opstats->stats[i].n_packets;
56a74d5307SMitko Haralanov n_bytes += rcd->opstats->stats[i].n_bytes;
57a74d5307SMitko Haralanov }
58a74d5307SMitko Haralanov hfi1_rcd_put(rcd);
59a74d5307SMitko Haralanov }
60a74d5307SMitko Haralanov for_each_possible_cpu(j) {
61a74d5307SMitko Haralanov struct hfi1_opcode_stats_perctx *sp =
62a74d5307SMitko Haralanov per_cpu_ptr(dd->tx_opstats, j);
63a74d5307SMitko Haralanov
64a74d5307SMitko Haralanov n_packets += sp->stats[i].n_packets;
65a74d5307SMitko Haralanov n_bytes += sp->stats[i].n_bytes;
66a74d5307SMitko Haralanov }
67a74d5307SMitko Haralanov if (!n_packets && !n_bytes)
68a74d5307SMitko Haralanov return SEQ_SKIP;
69a74d5307SMitko Haralanov if (!ibd->fault->n_rxfaults[i] && !ibd->fault->n_txfaults[i])
70a74d5307SMitko Haralanov return SEQ_SKIP;
71a74d5307SMitko Haralanov seq_printf(s, "%02llx %llu/%llu (faults rx:%llu faults: tx:%llu)\n", i,
72a74d5307SMitko Haralanov (unsigned long long)n_packets,
73a74d5307SMitko Haralanov (unsigned long long)n_bytes,
74a74d5307SMitko Haralanov (unsigned long long)ibd->fault->n_rxfaults[i],
75a74d5307SMitko Haralanov (unsigned long long)ibd->fault->n_txfaults[i]);
76a74d5307SMitko Haralanov return 0;
77a74d5307SMitko Haralanov }
78a74d5307SMitko Haralanov
/*
 * Instantiate the seq_file plumbing for "fault_stats" from the
 * _fault_stats_seq_{start,next,stop,show} callbacks above.
 * NOTE(review): these macros come from debugfs.h and presumably define
 * _fault_stats_file_ops, which hfi1_fault_init_debugfs() passes to
 * debugfs_create_file() - confirm against the macro definitions.
 */
DEBUGFS_SEQ_FILE_OPS(fault_stats);
DEBUGFS_SEQ_FILE_OPEN(fault_stats);
DEBUGFS_FILE_OPS(fault_stats);
82a74d5307SMitko Haralanov
fault_opcodes_open(struct inode * inode,struct file * file)83a74d5307SMitko Haralanov static int fault_opcodes_open(struct inode *inode, struct file *file)
84a74d5307SMitko Haralanov {
85a74d5307SMitko Haralanov file->private_data = inode->i_private;
86a74d5307SMitko Haralanov return nonseekable_open(inode, file);
87a74d5307SMitko Haralanov }
88a74d5307SMitko Haralanov
fault_opcodes_write(struct file * file,const char __user * buf,size_t len,loff_t * pos)89a74d5307SMitko Haralanov static ssize_t fault_opcodes_write(struct file *file, const char __user *buf,
90a74d5307SMitko Haralanov size_t len, loff_t *pos)
91a74d5307SMitko Haralanov {
92a74d5307SMitko Haralanov ssize_t ret = 0;
93a74d5307SMitko Haralanov /* 1280 = 256 opcodes * 4 chars/opcode + 255 commas + NULL */
94a74d5307SMitko Haralanov size_t copy, datalen = 1280;
95a74d5307SMitko Haralanov char *data, *token, *ptr, *end;
96a74d5307SMitko Haralanov struct fault *fault = file->private_data;
97a74d5307SMitko Haralanov
98a74d5307SMitko Haralanov data = kcalloc(datalen, sizeof(*data), GFP_KERNEL);
99a74d5307SMitko Haralanov if (!data)
100a74d5307SMitko Haralanov return -ENOMEM;
101a74d5307SMitko Haralanov copy = min(len, datalen - 1);
1022323d7baSWenwen Wang if (copy_from_user(data, buf, copy)) {
1032323d7baSWenwen Wang ret = -EFAULT;
1042323d7baSWenwen Wang goto free_data;
1052323d7baSWenwen Wang }
106a74d5307SMitko Haralanov
107a74d5307SMitko Haralanov ret = debugfs_file_get(file->f_path.dentry);
108a74d5307SMitko Haralanov if (unlikely(ret))
1092323d7baSWenwen Wang goto free_data;
110a74d5307SMitko Haralanov ptr = data;
111a74d5307SMitko Haralanov token = ptr;
112a74d5307SMitko Haralanov for (ptr = data; *ptr; ptr = end + 1, token = ptr) {
113a74d5307SMitko Haralanov char *dash;
114a74d5307SMitko Haralanov unsigned long range_start, range_end, i;
115a74d5307SMitko Haralanov bool remove = false;
1165f90677eSKaike Wan unsigned long bound = 1U << BITS_PER_BYTE;
117a74d5307SMitko Haralanov
118a74d5307SMitko Haralanov end = strchr(ptr, ',');
119a74d5307SMitko Haralanov if (end)
120a74d5307SMitko Haralanov *end = '\0';
121a74d5307SMitko Haralanov if (token[0] == '-') {
122a74d5307SMitko Haralanov remove = true;
123a74d5307SMitko Haralanov token++;
124a74d5307SMitko Haralanov }
125a74d5307SMitko Haralanov dash = strchr(token, '-');
126a74d5307SMitko Haralanov if (dash)
127a74d5307SMitko Haralanov *dash = '\0';
128a74d5307SMitko Haralanov if (kstrtoul(token, 0, &range_start))
129a74d5307SMitko Haralanov break;
130a74d5307SMitko Haralanov if (dash) {
131a74d5307SMitko Haralanov token = dash + 1;
132a74d5307SMitko Haralanov if (kstrtoul(token, 0, &range_end))
133a74d5307SMitko Haralanov break;
134a74d5307SMitko Haralanov } else {
135a74d5307SMitko Haralanov range_end = range_start;
136a74d5307SMitko Haralanov }
137a74d5307SMitko Haralanov if (range_start == range_end && range_start == -1UL) {
138a74d5307SMitko Haralanov bitmap_zero(fault->opcodes, sizeof(fault->opcodes) *
139a74d5307SMitko Haralanov BITS_PER_BYTE);
140a74d5307SMitko Haralanov break;
141a74d5307SMitko Haralanov }
1425f90677eSKaike Wan /* Check the inputs */
1435f90677eSKaike Wan if (range_start >= bound || range_end >= bound)
1445f90677eSKaike Wan break;
1455f90677eSKaike Wan
146a74d5307SMitko Haralanov for (i = range_start; i <= range_end; i++) {
147a74d5307SMitko Haralanov if (remove)
148a74d5307SMitko Haralanov clear_bit(i, fault->opcodes);
149a74d5307SMitko Haralanov else
150a74d5307SMitko Haralanov set_bit(i, fault->opcodes);
151a74d5307SMitko Haralanov }
152a74d5307SMitko Haralanov if (!end)
153a74d5307SMitko Haralanov break;
154a74d5307SMitko Haralanov }
155a74d5307SMitko Haralanov ret = len;
156a74d5307SMitko Haralanov
157a74d5307SMitko Haralanov debugfs_file_put(file->f_path.dentry);
1582323d7baSWenwen Wang free_data:
159a74d5307SMitko Haralanov kfree(data);
160a74d5307SMitko Haralanov return ret;
161a74d5307SMitko Haralanov }
162a74d5307SMitko Haralanov
fault_opcodes_read(struct file * file,char __user * buf,size_t len,loff_t * pos)163a74d5307SMitko Haralanov static ssize_t fault_opcodes_read(struct file *file, char __user *buf,
164a74d5307SMitko Haralanov size_t len, loff_t *pos)
165a74d5307SMitko Haralanov {
166a74d5307SMitko Haralanov ssize_t ret = 0;
167a74d5307SMitko Haralanov char *data;
168a74d5307SMitko Haralanov size_t datalen = 1280, size = 0; /* see fault_opcodes_write() */
169a74d5307SMitko Haralanov unsigned long bit = 0, zero = 0;
170a74d5307SMitko Haralanov struct fault *fault = file->private_data;
171a74d5307SMitko Haralanov size_t bitsize = sizeof(fault->opcodes) * BITS_PER_BYTE;
172a74d5307SMitko Haralanov
173a74d5307SMitko Haralanov data = kcalloc(datalen, sizeof(*data), GFP_KERNEL);
174a74d5307SMitko Haralanov if (!data)
175a74d5307SMitko Haralanov return -ENOMEM;
176a74d5307SMitko Haralanov ret = debugfs_file_get(file->f_path.dentry);
177a74d5307SMitko Haralanov if (unlikely(ret))
178b08afa06SWenwen Wang goto free_data;
179a74d5307SMitko Haralanov bit = find_first_bit(fault->opcodes, bitsize);
180a74d5307SMitko Haralanov while (bit < bitsize) {
181a74d5307SMitko Haralanov zero = find_next_zero_bit(fault->opcodes, bitsize, bit);
182a74d5307SMitko Haralanov if (zero - 1 != bit)
18323ab5261STakashi Iwai size += scnprintf(data + size,
184a74d5307SMitko Haralanov datalen - size - 1,
185a74d5307SMitko Haralanov "0x%lx-0x%lx,", bit, zero - 1);
186a74d5307SMitko Haralanov else
18723ab5261STakashi Iwai size += scnprintf(data + size,
188a74d5307SMitko Haralanov datalen - size - 1, "0x%lx,",
189a74d5307SMitko Haralanov bit);
190a74d5307SMitko Haralanov bit = find_next_bit(fault->opcodes, bitsize, zero);
191a74d5307SMitko Haralanov }
192a74d5307SMitko Haralanov debugfs_file_put(file->f_path.dentry);
193a74d5307SMitko Haralanov data[size - 1] = '\n';
194a74d5307SMitko Haralanov data[size] = '\0';
195a74d5307SMitko Haralanov ret = simple_read_from_buffer(buf, len, pos, data, size);
196b08afa06SWenwen Wang free_data:
197a74d5307SMitko Haralanov kfree(data);
198a74d5307SMitko Haralanov return ret;
199a74d5307SMitko Haralanov }
200a74d5307SMitko Haralanov
201a74d5307SMitko Haralanov static const struct file_operations __fault_opcodes_fops = {
202a74d5307SMitko Haralanov .owner = THIS_MODULE,
203a74d5307SMitko Haralanov .open = fault_opcodes_open,
204a74d5307SMitko Haralanov .read = fault_opcodes_read,
205a74d5307SMitko Haralanov .write = fault_opcodes_write,
206a74d5307SMitko Haralanov .llseek = no_llseek
207a74d5307SMitko Haralanov };
208a74d5307SMitko Haralanov
hfi1_fault_exit_debugfs(struct hfi1_ibdev * ibd)209a74d5307SMitko Haralanov void hfi1_fault_exit_debugfs(struct hfi1_ibdev *ibd)
210a74d5307SMitko Haralanov {
211a74d5307SMitko Haralanov if (ibd->fault)
212a74d5307SMitko Haralanov debugfs_remove_recursive(ibd->fault->dir);
213a74d5307SMitko Haralanov kfree(ibd->fault);
214a74d5307SMitko Haralanov ibd->fault = NULL;
215a74d5307SMitko Haralanov }
216a74d5307SMitko Haralanov
hfi1_fault_init_debugfs(struct hfi1_ibdev * ibd)217a74d5307SMitko Haralanov int hfi1_fault_init_debugfs(struct hfi1_ibdev *ibd)
218a74d5307SMitko Haralanov {
219a74d5307SMitko Haralanov struct dentry *parent = ibd->hfi1_ibdev_dbg;
220e7751180SGreg Kroah-Hartman struct dentry *fault_dir;
221a74d5307SMitko Haralanov
222a74d5307SMitko Haralanov ibd->fault = kzalloc(sizeof(*ibd->fault), GFP_KERNEL);
223a74d5307SMitko Haralanov if (!ibd->fault)
224a74d5307SMitko Haralanov return -ENOMEM;
225a74d5307SMitko Haralanov
226a74d5307SMitko Haralanov ibd->fault->attr.interval = 1;
227a74d5307SMitko Haralanov ibd->fault->attr.require_end = ULONG_MAX;
228a74d5307SMitko Haralanov ibd->fault->attr.stacktrace_depth = 32;
229a74d5307SMitko Haralanov ibd->fault->attr.dname = NULL;
230a74d5307SMitko Haralanov ibd->fault->attr.verbose = 0;
231a74d5307SMitko Haralanov ibd->fault->enable = false;
232a74d5307SMitko Haralanov ibd->fault->opcode = false;
233a74d5307SMitko Haralanov ibd->fault->fault_skip = 0;
234a74d5307SMitko Haralanov ibd->fault->skip = 0;
235a74d5307SMitko Haralanov ibd->fault->direction = HFI1_FAULT_DIR_TXRX;
236a74d5307SMitko Haralanov ibd->fault->suppress_err = false;
237a74d5307SMitko Haralanov bitmap_zero(ibd->fault->opcodes,
238a74d5307SMitko Haralanov sizeof(ibd->fault->opcodes) * BITS_PER_BYTE);
239a74d5307SMitko Haralanov
240e7751180SGreg Kroah-Hartman fault_dir =
241e7751180SGreg Kroah-Hartman fault_create_debugfs_attr("fault", parent, &ibd->fault->attr);
242e7751180SGreg Kroah-Hartman if (IS_ERR(fault_dir)) {
243a74d5307SMitko Haralanov kfree(ibd->fault);
244a74d5307SMitko Haralanov ibd->fault = NULL;
245a74d5307SMitko Haralanov return -ENOENT;
246a74d5307SMitko Haralanov }
247e7751180SGreg Kroah-Hartman ibd->fault->dir = fault_dir;
248a74d5307SMitko Haralanov
249e7751180SGreg Kroah-Hartman debugfs_create_file("fault_stats", 0444, fault_dir, ibd,
2505c432764SGreg Kroah-Hartman &_fault_stats_file_ops);
251e7751180SGreg Kroah-Hartman debugfs_create_bool("enable", 0600, fault_dir, &ibd->fault->enable);
252e7751180SGreg Kroah-Hartman debugfs_create_bool("suppress_err", 0600, fault_dir,
253e7751180SGreg Kroah-Hartman &ibd->fault->suppress_err);
254e7751180SGreg Kroah-Hartman debugfs_create_bool("opcode_mode", 0600, fault_dir,
255e7751180SGreg Kroah-Hartman &ibd->fault->opcode);
256e7751180SGreg Kroah-Hartman debugfs_create_file("opcodes", 0600, fault_dir, ibd->fault,
257e7751180SGreg Kroah-Hartman &__fault_opcodes_fops);
258e7751180SGreg Kroah-Hartman debugfs_create_u64("skip_pkts", 0600, fault_dir,
259e7751180SGreg Kroah-Hartman &ibd->fault->fault_skip);
260e7751180SGreg Kroah-Hartman debugfs_create_u64("skip_usec", 0600, fault_dir,
261e7751180SGreg Kroah-Hartman &ibd->fault->fault_skip_usec);
262e7751180SGreg Kroah-Hartman debugfs_create_u8("direction", 0600, fault_dir, &ibd->fault->direction);
263a74d5307SMitko Haralanov
264a74d5307SMitko Haralanov return 0;
265a74d5307SMitko Haralanov }
266a74d5307SMitko Haralanov
hfi1_dbg_fault_suppress_err(struct hfi1_ibdev * ibd)267a74d5307SMitko Haralanov bool hfi1_dbg_fault_suppress_err(struct hfi1_ibdev *ibd)
268a74d5307SMitko Haralanov {
269a74d5307SMitko Haralanov if (ibd->fault)
270a74d5307SMitko Haralanov return ibd->fault->suppress_err;
271a74d5307SMitko Haralanov return false;
272a74d5307SMitko Haralanov }
273a74d5307SMitko Haralanov
__hfi1_should_fault(struct hfi1_ibdev * ibd,u32 opcode,u8 direction)274a74d5307SMitko Haralanov static bool __hfi1_should_fault(struct hfi1_ibdev *ibd, u32 opcode,
275a74d5307SMitko Haralanov u8 direction)
276a74d5307SMitko Haralanov {
277a74d5307SMitko Haralanov bool ret = false;
278a74d5307SMitko Haralanov
279a74d5307SMitko Haralanov if (!ibd->fault || !ibd->fault->enable)
280a74d5307SMitko Haralanov return false;
281a74d5307SMitko Haralanov if (!(ibd->fault->direction & direction))
282a74d5307SMitko Haralanov return false;
283a74d5307SMitko Haralanov if (ibd->fault->opcode) {
284a74d5307SMitko Haralanov if (bitmap_empty(ibd->fault->opcodes,
285a74d5307SMitko Haralanov (sizeof(ibd->fault->opcodes) *
286a74d5307SMitko Haralanov BITS_PER_BYTE)))
287a74d5307SMitko Haralanov return false;
288a74d5307SMitko Haralanov if (!(test_bit(opcode, ibd->fault->opcodes)))
289a74d5307SMitko Haralanov return false;
290a74d5307SMitko Haralanov }
291a74d5307SMitko Haralanov if (ibd->fault->fault_skip_usec &&
292a74d5307SMitko Haralanov time_before(jiffies, ibd->fault->skip_usec))
293a74d5307SMitko Haralanov return false;
294a74d5307SMitko Haralanov if (ibd->fault->fault_skip && ibd->fault->skip) {
295a74d5307SMitko Haralanov ibd->fault->skip--;
296a74d5307SMitko Haralanov return false;
297a74d5307SMitko Haralanov }
298a74d5307SMitko Haralanov ret = should_fail(&ibd->fault->attr, 1);
299a74d5307SMitko Haralanov if (ret) {
300a74d5307SMitko Haralanov ibd->fault->skip = ibd->fault->fault_skip;
301a74d5307SMitko Haralanov ibd->fault->skip_usec = jiffies +
302a74d5307SMitko Haralanov usecs_to_jiffies(ibd->fault->fault_skip_usec);
303a74d5307SMitko Haralanov }
304a74d5307SMitko Haralanov return ret;
305a74d5307SMitko Haralanov }
306a74d5307SMitko Haralanov
hfi1_dbg_should_fault_tx(struct rvt_qp * qp,u32 opcode)307a74d5307SMitko Haralanov bool hfi1_dbg_should_fault_tx(struct rvt_qp *qp, u32 opcode)
308a74d5307SMitko Haralanov {
309a74d5307SMitko Haralanov struct hfi1_ibdev *ibd = to_idev(qp->ibqp.device);
310a74d5307SMitko Haralanov
311a74d5307SMitko Haralanov if (__hfi1_should_fault(ibd, opcode, HFI1_FAULT_DIR_TX)) {
312a74d5307SMitko Haralanov trace_hfi1_fault_opcode(qp, opcode);
313a74d5307SMitko Haralanov ibd->fault->n_txfaults[opcode]++;
314a74d5307SMitko Haralanov return true;
315a74d5307SMitko Haralanov }
316a74d5307SMitko Haralanov return false;
317a74d5307SMitko Haralanov }
318a74d5307SMitko Haralanov
hfi1_dbg_should_fault_rx(struct hfi1_packet * packet)319a74d5307SMitko Haralanov bool hfi1_dbg_should_fault_rx(struct hfi1_packet *packet)
320a74d5307SMitko Haralanov {
321a74d5307SMitko Haralanov struct hfi1_ibdev *ibd = &packet->rcd->dd->verbs_dev;
322a74d5307SMitko Haralanov
323a74d5307SMitko Haralanov if (__hfi1_should_fault(ibd, packet->opcode, HFI1_FAULT_DIR_RX)) {
324a74d5307SMitko Haralanov trace_hfi1_fault_packet(packet);
325a74d5307SMitko Haralanov ibd->fault->n_rxfaults[packet->opcode]++;
326a74d5307SMitko Haralanov return true;
327a74d5307SMitko Haralanov }
328a74d5307SMitko Haralanov return false;
329a74d5307SMitko Haralanov }
330