erdma_eq.c 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320
  1. // SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
  2. /* Authors: Cheng Xu <[email protected]> */
  3. /* Kai Shen <[email protected]> */
  4. /* Copyright (c) 2020-2022, Alibaba Group. */
  5. #include "erdma_verbs.h"
  6. #define MAX_POLL_CHUNK_SIZE 16
  7. void notify_eq(struct erdma_eq *eq)
  8. {
  9. u64 db_data = FIELD_PREP(ERDMA_EQDB_CI_MASK, eq->ci) |
  10. FIELD_PREP(ERDMA_EQDB_ARM_MASK, 1);
  11. *eq->db_record = db_data;
  12. writeq(db_data, eq->db_addr);
  13. atomic64_inc(&eq->notify_num);
  14. }
  15. void *get_next_valid_eqe(struct erdma_eq *eq)
  16. {
  17. u64 *eqe = get_queue_entry(eq->qbuf, eq->ci, eq->depth, EQE_SHIFT);
  18. u32 owner = FIELD_GET(ERDMA_CEQE_HDR_O_MASK, READ_ONCE(*eqe));
  19. return owner ^ !!(eq->ci & eq->depth) ? eqe : NULL;
  20. }
  21. void erdma_aeq_event_handler(struct erdma_dev *dev)
  22. {
  23. struct erdma_aeqe *aeqe;
  24. u32 cqn, qpn;
  25. struct erdma_qp *qp;
  26. struct erdma_cq *cq;
  27. struct ib_event event;
  28. u32 poll_cnt = 0;
  29. memset(&event, 0, sizeof(event));
  30. while (poll_cnt < MAX_POLL_CHUNK_SIZE) {
  31. aeqe = get_next_valid_eqe(&dev->aeq);
  32. if (!aeqe)
  33. break;
  34. dma_rmb();
  35. dev->aeq.ci++;
  36. atomic64_inc(&dev->aeq.event_num);
  37. poll_cnt++;
  38. if (FIELD_GET(ERDMA_AEQE_HDR_TYPE_MASK,
  39. le32_to_cpu(aeqe->hdr)) == ERDMA_AE_TYPE_CQ_ERR) {
  40. cqn = le32_to_cpu(aeqe->event_data0);
  41. cq = find_cq_by_cqn(dev, cqn);
  42. if (!cq)
  43. continue;
  44. event.device = cq->ibcq.device;
  45. event.element.cq = &cq->ibcq;
  46. event.event = IB_EVENT_CQ_ERR;
  47. if (cq->ibcq.event_handler)
  48. cq->ibcq.event_handler(&event,
  49. cq->ibcq.cq_context);
  50. } else {
  51. qpn = le32_to_cpu(aeqe->event_data0);
  52. qp = find_qp_by_qpn(dev, qpn);
  53. if (!qp)
  54. continue;
  55. event.device = qp->ibqp.device;
  56. event.element.qp = &qp->ibqp;
  57. event.event = IB_EVENT_QP_FATAL;
  58. if (qp->ibqp.event_handler)
  59. qp->ibqp.event_handler(&event,
  60. qp->ibqp.qp_context);
  61. }
  62. }
  63. notify_eq(&dev->aeq);
  64. }
  65. int erdma_aeq_init(struct erdma_dev *dev)
  66. {
  67. struct erdma_eq *eq = &dev->aeq;
  68. u32 buf_size;
  69. eq->depth = ERDMA_DEFAULT_EQ_DEPTH;
  70. buf_size = eq->depth << EQE_SHIFT;
  71. eq->qbuf =
  72. dma_alloc_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size),
  73. &eq->qbuf_dma_addr, GFP_KERNEL | __GFP_ZERO);
  74. if (!eq->qbuf)
  75. return -ENOMEM;
  76. spin_lock_init(&eq->lock);
  77. atomic64_set(&eq->event_num, 0);
  78. atomic64_set(&eq->notify_num, 0);
  79. eq->db_addr = (u64 __iomem *)(dev->func_bar + ERDMA_REGS_AEQ_DB_REG);
  80. eq->db_record = (u64 *)(eq->qbuf + buf_size);
  81. erdma_reg_write32(dev, ERDMA_REGS_AEQ_ADDR_H_REG,
  82. upper_32_bits(eq->qbuf_dma_addr));
  83. erdma_reg_write32(dev, ERDMA_REGS_AEQ_ADDR_L_REG,
  84. lower_32_bits(eq->qbuf_dma_addr));
  85. erdma_reg_write32(dev, ERDMA_REGS_AEQ_DEPTH_REG, eq->depth);
  86. erdma_reg_write64(dev, ERDMA_AEQ_DB_HOST_ADDR_REG,
  87. eq->qbuf_dma_addr + buf_size);
  88. return 0;
  89. }
  90. void erdma_aeq_destroy(struct erdma_dev *dev)
  91. {
  92. struct erdma_eq *eq = &dev->aeq;
  93. dma_free_coherent(&dev->pdev->dev,
  94. WARPPED_BUFSIZE(eq->depth << EQE_SHIFT), eq->qbuf,
  95. eq->qbuf_dma_addr);
  96. }
  97. void erdma_ceq_completion_handler(struct erdma_eq_cb *ceq_cb)
  98. {
  99. struct erdma_dev *dev = ceq_cb->dev;
  100. struct erdma_cq *cq;
  101. u32 poll_cnt = 0;
  102. u64 *ceqe;
  103. int cqn;
  104. if (!ceq_cb->ready)
  105. return;
  106. while (poll_cnt < MAX_POLL_CHUNK_SIZE) {
  107. ceqe = get_next_valid_eqe(&ceq_cb->eq);
  108. if (!ceqe)
  109. break;
  110. dma_rmb();
  111. ceq_cb->eq.ci++;
  112. poll_cnt++;
  113. cqn = FIELD_GET(ERDMA_CEQE_HDR_CQN_MASK, READ_ONCE(*ceqe));
  114. cq = find_cq_by_cqn(dev, cqn);
  115. if (!cq)
  116. continue;
  117. if (rdma_is_kernel_res(&cq->ibcq.res))
  118. cq->kern_cq.cmdsn++;
  119. if (cq->ibcq.comp_handler)
  120. cq->ibcq.comp_handler(&cq->ibcq, cq->ibcq.cq_context);
  121. }
  122. notify_eq(&ceq_cb->eq);
  123. }
  124. static irqreturn_t erdma_intr_ceq_handler(int irq, void *data)
  125. {
  126. struct erdma_eq_cb *ceq_cb = data;
  127. tasklet_schedule(&ceq_cb->tasklet);
  128. return IRQ_HANDLED;
  129. }
  130. static void erdma_intr_ceq_task(unsigned long data)
  131. {
  132. erdma_ceq_completion_handler((struct erdma_eq_cb *)data);
  133. }
  134. static int erdma_set_ceq_irq(struct erdma_dev *dev, u16 ceqn)
  135. {
  136. struct erdma_eq_cb *eqc = &dev->ceqs[ceqn];
  137. int err;
  138. snprintf(eqc->irq.name, ERDMA_IRQNAME_SIZE, "erdma-ceq%u@pci:%s", ceqn,
  139. pci_name(dev->pdev));
  140. eqc->irq.msix_vector = pci_irq_vector(dev->pdev, ceqn + 1);
  141. tasklet_init(&dev->ceqs[ceqn].tasklet, erdma_intr_ceq_task,
  142. (unsigned long)&dev->ceqs[ceqn]);
  143. cpumask_set_cpu(cpumask_local_spread(ceqn + 1, dev->attrs.numa_node),
  144. &eqc->irq.affinity_hint_mask);
  145. err = request_irq(eqc->irq.msix_vector, erdma_intr_ceq_handler, 0,
  146. eqc->irq.name, eqc);
  147. if (err) {
  148. dev_err(&dev->pdev->dev, "failed to request_irq(%d)\n", err);
  149. return err;
  150. }
  151. irq_set_affinity_hint(eqc->irq.msix_vector,
  152. &eqc->irq.affinity_hint_mask);
  153. return 0;
  154. }
  155. static void erdma_free_ceq_irq(struct erdma_dev *dev, u16 ceqn)
  156. {
  157. struct erdma_eq_cb *eqc = &dev->ceqs[ceqn];
  158. irq_set_affinity_hint(eqc->irq.msix_vector, NULL);
  159. free_irq(eqc->irq.msix_vector, eqc);
  160. }
  161. static int create_eq_cmd(struct erdma_dev *dev, u32 eqn, struct erdma_eq *eq)
  162. {
  163. struct erdma_cmdq_create_eq_req req;
  164. dma_addr_t db_info_dma_addr;
  165. erdma_cmdq_build_reqhdr(&req.hdr, CMDQ_SUBMOD_COMMON,
  166. CMDQ_OPCODE_CREATE_EQ);
  167. req.eqn = eqn;
  168. req.depth = ilog2(eq->depth);
  169. req.qbuf_addr = eq->qbuf_dma_addr;
  170. req.qtype = ERDMA_EQ_TYPE_CEQ;
  171. /* Vector index is the same as EQN. */
  172. req.vector_idx = eqn;
  173. db_info_dma_addr = eq->qbuf_dma_addr + (eq->depth << EQE_SHIFT);
  174. req.db_dma_addr_l = lower_32_bits(db_info_dma_addr);
  175. req.db_dma_addr_h = upper_32_bits(db_info_dma_addr);
  176. return erdma_post_cmd_wait(&dev->cmdq, &req, sizeof(req), NULL, NULL);
  177. }
  178. static int erdma_ceq_init_one(struct erdma_dev *dev, u16 ceqn)
  179. {
  180. struct erdma_eq *eq = &dev->ceqs[ceqn].eq;
  181. u32 buf_size = ERDMA_DEFAULT_EQ_DEPTH << EQE_SHIFT;
  182. int ret;
  183. eq->qbuf =
  184. dma_alloc_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size),
  185. &eq->qbuf_dma_addr, GFP_KERNEL | __GFP_ZERO);
  186. if (!eq->qbuf)
  187. return -ENOMEM;
  188. spin_lock_init(&eq->lock);
  189. atomic64_set(&eq->event_num, 0);
  190. atomic64_set(&eq->notify_num, 0);
  191. eq->depth = ERDMA_DEFAULT_EQ_DEPTH;
  192. eq->db_addr =
  193. (u64 __iomem *)(dev->func_bar + ERDMA_REGS_CEQ_DB_BASE_REG +
  194. (ceqn + 1) * ERDMA_DB_SIZE);
  195. eq->db_record = (u64 *)(eq->qbuf + buf_size);
  196. eq->ci = 0;
  197. dev->ceqs[ceqn].dev = dev;
  198. /* CEQ indexed from 1, 0 rsvd for CMDQ-EQ. */
  199. ret = create_eq_cmd(dev, ceqn + 1, eq);
  200. dev->ceqs[ceqn].ready = ret ? false : true;
  201. return ret;
  202. }
  203. static void erdma_ceq_uninit_one(struct erdma_dev *dev, u16 ceqn)
  204. {
  205. struct erdma_eq *eq = &dev->ceqs[ceqn].eq;
  206. u32 buf_size = ERDMA_DEFAULT_EQ_DEPTH << EQE_SHIFT;
  207. struct erdma_cmdq_destroy_eq_req req;
  208. int err;
  209. dev->ceqs[ceqn].ready = 0;
  210. erdma_cmdq_build_reqhdr(&req.hdr, CMDQ_SUBMOD_COMMON,
  211. CMDQ_OPCODE_DESTROY_EQ);
  212. /* CEQ indexed from 1, 0 rsvd for CMDQ-EQ. */
  213. req.eqn = ceqn + 1;
  214. req.qtype = ERDMA_EQ_TYPE_CEQ;
  215. req.vector_idx = ceqn + 1;
  216. err = erdma_post_cmd_wait(&dev->cmdq, &req, sizeof(req), NULL, NULL);
  217. if (err)
  218. return;
  219. dma_free_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size), eq->qbuf,
  220. eq->qbuf_dma_addr);
  221. }
  222. int erdma_ceqs_init(struct erdma_dev *dev)
  223. {
  224. u32 i, j;
  225. int err;
  226. for (i = 0; i < dev->attrs.irq_num - 1; i++) {
  227. err = erdma_ceq_init_one(dev, i);
  228. if (err)
  229. goto out_err;
  230. err = erdma_set_ceq_irq(dev, i);
  231. if (err) {
  232. erdma_ceq_uninit_one(dev, i);
  233. goto out_err;
  234. }
  235. }
  236. return 0;
  237. out_err:
  238. for (j = 0; j < i; j++) {
  239. erdma_free_ceq_irq(dev, j);
  240. erdma_ceq_uninit_one(dev, j);
  241. }
  242. return err;
  243. }
  244. void erdma_ceqs_uninit(struct erdma_dev *dev)
  245. {
  246. u32 i;
  247. for (i = 0; i < dev->attrs.irq_num - 1; i++) {
  248. erdma_free_ceq_irq(dev, i);
  249. erdma_ceq_uninit_one(dev, i);
  250. }
  251. }