fault.c 8.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329
  1. // SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause
  2. /*
  3. * Copyright(c) 2018 Intel Corporation.
  4. */
  5. #include <linux/debugfs.h>
  6. #include <linux/seq_file.h>
  7. #include <linux/kernel.h>
  8. #include <linux/types.h>
  9. #include <linux/bitmap.h>
  10. #include "debugfs.h"
  11. #include "fault.h"
  12. #include "trace.h"
  /*
   * Direction bits for fault injection.  The per-device "direction" setting is
   * a mask of these bits; a fault is only considered when the bit for the path
   * being checked (TX or RX) is set in that mask.
   */
  #define HFI1_FAULT_DIR_TX	BIT(0)
  #define HFI1_FAULT_DIR_RX	BIT(1)
  /* Both directions; used as the initial value of the mask. */
  #define HFI1_FAULT_DIR_TXRX	(HFI1_FAULT_DIR_RX | HFI1_FAULT_DIR_TX)
  16. static void *_fault_stats_seq_start(struct seq_file *s, loff_t *pos)
  17. {
  18. struct hfi1_opcode_stats_perctx *opstats;
  19. if (*pos >= ARRAY_SIZE(opstats->stats))
  20. return NULL;
  21. return pos;
  22. }
  23. static void *_fault_stats_seq_next(struct seq_file *s, void *v, loff_t *pos)
  24. {
  25. struct hfi1_opcode_stats_perctx *opstats;
  26. ++*pos;
  27. if (*pos >= ARRAY_SIZE(opstats->stats))
  28. return NULL;
  29. return pos;
  30. }
  /*
   * seq_file stop callback for the fault statistics file.
   *
   * The start/next callbacks in this file acquire nothing, so there is nothing
   * to release here.
   */
  static void _fault_stats_seq_stop(struct seq_file *s, void *v)
  {
  	/* Intentionally empty. */
  }
  34. static int _fault_stats_seq_show(struct seq_file *s, void *v)
  35. {
  36. loff_t *spos = v;
  37. loff_t i = *spos, j;
  38. u64 n_packets = 0, n_bytes = 0;
  39. struct hfi1_ibdev *ibd = (struct hfi1_ibdev *)s->private;
  40. struct hfi1_devdata *dd = dd_from_dev(ibd);
  41. struct hfi1_ctxtdata *rcd;
  42. for (j = 0; j < dd->first_dyn_alloc_ctxt; j++) {
  43. rcd = hfi1_rcd_get_by_index(dd, j);
  44. if (rcd) {
  45. n_packets += rcd->opstats->stats[i].n_packets;
  46. n_bytes += rcd->opstats->stats[i].n_bytes;
  47. }
  48. hfi1_rcd_put(rcd);
  49. }
  50. for_each_possible_cpu(j) {
  51. struct hfi1_opcode_stats_perctx *sp =
  52. per_cpu_ptr(dd->tx_opstats, j);
  53. n_packets += sp->stats[i].n_packets;
  54. n_bytes += sp->stats[i].n_bytes;
  55. }
  56. if (!n_packets && !n_bytes)
  57. return SEQ_SKIP;
  58. if (!ibd->fault->n_rxfaults[i] && !ibd->fault->n_txfaults[i])
  59. return SEQ_SKIP;
  60. seq_printf(s, "%02llx %llu/%llu (faults rx:%llu faults: tx:%llu)\n", i,
  61. (unsigned long long)n_packets,
  62. (unsigned long long)n_bytes,
  63. (unsigned long long)ibd->fault->n_rxfaults[i],
  64. (unsigned long long)ibd->fault->n_txfaults[i]);
  65. return 0;
  66. }
  /*
   * Instantiate the debugfs plumbing for the "fault_stats" file from the
   * _fault_stats_seq_{start,next,stop,show} callbacks above.
   *
   * NOTE(review): these macros are not defined in this file (presumably in
   * "debugfs.h").  Together they are expected to provide the
   * _fault_stats_file_ops object that hfi1_fault_init_debugfs() registers;
   * keep the three invocations in this order unless the macro definitions
   * have been checked.
   */
  DEBUGFS_SEQ_FILE_OPS(fault_stats);
  DEBUGFS_SEQ_FILE_OPEN(fault_stats);
  DEBUGFS_FILE_OPS(fault_stats);
  70. static int fault_opcodes_open(struct inode *inode, struct file *file)
  71. {
  72. file->private_data = inode->i_private;
  73. return nonseekable_open(inode, file);
  74. }
  75. static ssize_t fault_opcodes_write(struct file *file, const char __user *buf,
  76. size_t len, loff_t *pos)
  77. {
  78. ssize_t ret = 0;
  79. /* 1280 = 256 opcodes * 4 chars/opcode + 255 commas + NULL */
  80. size_t copy, datalen = 1280;
  81. char *data, *token, *ptr, *end;
  82. struct fault *fault = file->private_data;
  83. data = kcalloc(datalen, sizeof(*data), GFP_KERNEL);
  84. if (!data)
  85. return -ENOMEM;
  86. copy = min(len, datalen - 1);
  87. if (copy_from_user(data, buf, copy)) {
  88. ret = -EFAULT;
  89. goto free_data;
  90. }
  91. ret = debugfs_file_get(file->f_path.dentry);
  92. if (unlikely(ret))
  93. goto free_data;
  94. ptr = data;
  95. token = ptr;
  96. for (ptr = data; *ptr; ptr = end + 1, token = ptr) {
  97. char *dash;
  98. unsigned long range_start, range_end, i;
  99. bool remove = false;
  100. unsigned long bound = 1U << BITS_PER_BYTE;
  101. end = strchr(ptr, ',');
  102. if (end)
  103. *end = '\0';
  104. if (token[0] == '-') {
  105. remove = true;
  106. token++;
  107. }
  108. dash = strchr(token, '-');
  109. if (dash)
  110. *dash = '\0';
  111. if (kstrtoul(token, 0, &range_start))
  112. break;
  113. if (dash) {
  114. token = dash + 1;
  115. if (kstrtoul(token, 0, &range_end))
  116. break;
  117. } else {
  118. range_end = range_start;
  119. }
  120. if (range_start == range_end && range_start == -1UL) {
  121. bitmap_zero(fault->opcodes, sizeof(fault->opcodes) *
  122. BITS_PER_BYTE);
  123. break;
  124. }
  125. /* Check the inputs */
  126. if (range_start >= bound || range_end >= bound)
  127. break;
  128. for (i = range_start; i <= range_end; i++) {
  129. if (remove)
  130. clear_bit(i, fault->opcodes);
  131. else
  132. set_bit(i, fault->opcodes);
  133. }
  134. if (!end)
  135. break;
  136. }
  137. ret = len;
  138. debugfs_file_put(file->f_path.dentry);
  139. free_data:
  140. kfree(data);
  141. return ret;
  142. }
  143. static ssize_t fault_opcodes_read(struct file *file, char __user *buf,
  144. size_t len, loff_t *pos)
  145. {
  146. ssize_t ret = 0;
  147. char *data;
  148. size_t datalen = 1280, size = 0; /* see fault_opcodes_write() */
  149. unsigned long bit = 0, zero = 0;
  150. struct fault *fault = file->private_data;
  151. size_t bitsize = sizeof(fault->opcodes) * BITS_PER_BYTE;
  152. data = kcalloc(datalen, sizeof(*data), GFP_KERNEL);
  153. if (!data)
  154. return -ENOMEM;
  155. ret = debugfs_file_get(file->f_path.dentry);
  156. if (unlikely(ret))
  157. goto free_data;
  158. bit = find_first_bit(fault->opcodes, bitsize);
  159. while (bit < bitsize) {
  160. zero = find_next_zero_bit(fault->opcodes, bitsize, bit);
  161. if (zero - 1 != bit)
  162. size += scnprintf(data + size,
  163. datalen - size - 1,
  164. "0x%lx-0x%lx,", bit, zero - 1);
  165. else
  166. size += scnprintf(data + size,
  167. datalen - size - 1, "0x%lx,",
  168. bit);
  169. bit = find_next_bit(fault->opcodes, bitsize, zero);
  170. }
  171. debugfs_file_put(file->f_path.dentry);
  172. data[size - 1] = '\n';
  173. data[size] = '\0';
  174. ret = simple_read_from_buffer(buf, len, pos, data, size);
  175. free_data:
  176. kfree(data);
  177. return ret;
  178. }
  179. static const struct file_operations __fault_opcodes_fops = {
  180. .owner = THIS_MODULE,
  181. .open = fault_opcodes_open,
  182. .read = fault_opcodes_read,
  183. .write = fault_opcodes_write,
  184. .llseek = no_llseek
  185. };
  186. void hfi1_fault_exit_debugfs(struct hfi1_ibdev *ibd)
  187. {
  188. if (ibd->fault)
  189. debugfs_remove_recursive(ibd->fault->dir);
  190. kfree(ibd->fault);
  191. ibd->fault = NULL;
  192. }
  193. int hfi1_fault_init_debugfs(struct hfi1_ibdev *ibd)
  194. {
  195. struct dentry *parent = ibd->hfi1_ibdev_dbg;
  196. struct dentry *fault_dir;
  197. ibd->fault = kzalloc(sizeof(*ibd->fault), GFP_KERNEL);
  198. if (!ibd->fault)
  199. return -ENOMEM;
  200. ibd->fault->attr.interval = 1;
  201. ibd->fault->attr.require_end = ULONG_MAX;
  202. ibd->fault->attr.stacktrace_depth = 32;
  203. ibd->fault->attr.dname = NULL;
  204. ibd->fault->attr.verbose = 0;
  205. ibd->fault->enable = false;
  206. ibd->fault->opcode = false;
  207. ibd->fault->fault_skip = 0;
  208. ibd->fault->skip = 0;
  209. ibd->fault->direction = HFI1_FAULT_DIR_TXRX;
  210. ibd->fault->suppress_err = false;
  211. bitmap_zero(ibd->fault->opcodes,
  212. sizeof(ibd->fault->opcodes) * BITS_PER_BYTE);
  213. fault_dir =
  214. fault_create_debugfs_attr("fault", parent, &ibd->fault->attr);
  215. if (IS_ERR(fault_dir)) {
  216. kfree(ibd->fault);
  217. ibd->fault = NULL;
  218. return -ENOENT;
  219. }
  220. ibd->fault->dir = fault_dir;
  221. debugfs_create_file("fault_stats", 0444, fault_dir, ibd,
  222. &_fault_stats_file_ops);
  223. debugfs_create_bool("enable", 0600, fault_dir, &ibd->fault->enable);
  224. debugfs_create_bool("suppress_err", 0600, fault_dir,
  225. &ibd->fault->suppress_err);
  226. debugfs_create_bool("opcode_mode", 0600, fault_dir,
  227. &ibd->fault->opcode);
  228. debugfs_create_file("opcodes", 0600, fault_dir, ibd->fault,
  229. &__fault_opcodes_fops);
  230. debugfs_create_u64("skip_pkts", 0600, fault_dir,
  231. &ibd->fault->fault_skip);
  232. debugfs_create_u64("skip_usec", 0600, fault_dir,
  233. &ibd->fault->fault_skip_usec);
  234. debugfs_create_u8("direction", 0600, fault_dir, &ibd->fault->direction);
  235. return 0;
  236. }
  237. bool hfi1_dbg_fault_suppress_err(struct hfi1_ibdev *ibd)
  238. {
  239. if (ibd->fault)
  240. return ibd->fault->suppress_err;
  241. return false;
  242. }
  243. static bool __hfi1_should_fault(struct hfi1_ibdev *ibd, u32 opcode,
  244. u8 direction)
  245. {
  246. bool ret = false;
  247. if (!ibd->fault || !ibd->fault->enable)
  248. return false;
  249. if (!(ibd->fault->direction & direction))
  250. return false;
  251. if (ibd->fault->opcode) {
  252. if (bitmap_empty(ibd->fault->opcodes,
  253. (sizeof(ibd->fault->opcodes) *
  254. BITS_PER_BYTE)))
  255. return false;
  256. if (!(test_bit(opcode, ibd->fault->opcodes)))
  257. return false;
  258. }
  259. if (ibd->fault->fault_skip_usec &&
  260. time_before(jiffies, ibd->fault->skip_usec))
  261. return false;
  262. if (ibd->fault->fault_skip && ibd->fault->skip) {
  263. ibd->fault->skip--;
  264. return false;
  265. }
  266. ret = should_fail(&ibd->fault->attr, 1);
  267. if (ret) {
  268. ibd->fault->skip = ibd->fault->fault_skip;
  269. ibd->fault->skip_usec = jiffies +
  270. usecs_to_jiffies(ibd->fault->fault_skip_usec);
  271. }
  272. return ret;
  273. }
  274. bool hfi1_dbg_should_fault_tx(struct rvt_qp *qp, u32 opcode)
  275. {
  276. struct hfi1_ibdev *ibd = to_idev(qp->ibqp.device);
  277. if (__hfi1_should_fault(ibd, opcode, HFI1_FAULT_DIR_TX)) {
  278. trace_hfi1_fault_opcode(qp, opcode);
  279. ibd->fault->n_txfaults[opcode]++;
  280. return true;
  281. }
  282. return false;
  283. }
  284. bool hfi1_dbg_should_fault_rx(struct hfi1_packet *packet)
  285. {
  286. struct hfi1_ibdev *ibd = &packet->rcd->dd->verbs_dev;
  287. if (__hfi1_should_fault(ibd, packet->opcode, HFI1_FAULT_DIR_RX)) {
  288. trace_hfi1_fault_packet(packet);
  289. ibd->fault->n_rxfaults[packet->opcode]++;
  290. return true;
  291. }
  292. return false;
  293. }