qib.h 49 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493
  1. #ifndef _QIB_KERNEL_H
  2. #define _QIB_KERNEL_H
  3. /*
  4. * Copyright (c) 2012 - 2017 Intel Corporation. All rights reserved.
  5. * Copyright (c) 2006 - 2012 QLogic Corporation. All rights reserved.
  6. * Copyright (c) 2003, 2004, 2005, 2006 PathScale, Inc. All rights reserved.
  7. *
  8. * This software is available to you under a choice of one of two
  9. * licenses. You may choose to be licensed under the terms of the GNU
  10. * General Public License (GPL) Version 2, available from the file
  11. * COPYING in the main directory of this source tree, or the
  12. * OpenIB.org BSD license below:
  13. *
  14. * Redistribution and use in source and binary forms, with or
  15. * without modification, are permitted provided that the following
  16. * conditions are met:
  17. *
  18. * - Redistributions of source code must retain the above
  19. * copyright notice, this list of conditions and the following
  20. * disclaimer.
  21. *
  22. * - Redistributions in binary form must reproduce the above
  23. * copyright notice, this list of conditions and the following
  24. * disclaimer in the documentation and/or other materials
  25. * provided with the distribution.
  26. *
  27. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  28. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  29. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  30. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  31. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  32. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  33. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  34. * SOFTWARE.
  35. */
  36. /*
  37. * This header file is the base header file for qlogic_ib kernel code
  38. * qib_user.h serves a similar purpose for user code.
  39. */
  40. #include <linux/interrupt.h>
  41. #include <linux/pci.h>
  42. #include <linux/dma-mapping.h>
  43. #include <linux/mutex.h>
  44. #include <linux/list.h>
  45. #include <linux/scatterlist.h>
  46. #include <linux/slab.h>
  47. #include <linux/io.h>
  48. #include <linux/fs.h>
  49. #include <linux/completion.h>
  50. #include <linux/kref.h>
  51. #include <linux/sched.h>
  52. #include <linux/kthread.h>
  53. #include <linux/xarray.h>
  54. #include <rdma/ib_hdrs.h>
  55. #include <rdma/rdma_vt.h>
  56. #include "qib_common.h"
  57. #include "qib_verbs.h"
  58. /* only s/w major version of QLogic_IB we can handle */
  59. #define QIB_CHIP_VERS_MAJ 2U
  60. /* don't care about this except printing */
  61. #define QIB_CHIP_VERS_MIN 0U
  62. /* The Organization Unique Identifier (Mfg code), and its position in GUID */
  63. #define QIB_OUI 0x001175
  64. #define QIB_OUI_LSB 40
  65. /*
  66. * per driver stats, either not device nor port-specific, or
  67. * summed over all of the devices and ports.
  68. * They are described by name via ipathfs filesystem, so layout
  69. * and number of elements can change without breaking compatibility.
  70. * If members are added or deleted qib_statnames[] in qib_fs.c must
  71. * change to match.
  72. */
  73. struct qlogic_ib_stats {
  74. __u64 sps_ints; /* number of interrupts handled */
  75. __u64 sps_errints; /* number of error interrupts */
  76. __u64 sps_txerrs; /* tx-related packet errors */
  77. __u64 sps_rcverrs; /* non-crc rcv packet errors */
  78. __u64 sps_hwerrs; /* hardware errors reported (parity, etc.) */
  79. __u64 sps_nopiobufs; /* no pio bufs avail from kernel */
  80. __u64 sps_ctxts; /* number of contexts currently open */
  81. __u64 sps_lenerrs; /* number of kernel packets where RHF != LRH len */
  82. __u64 sps_buffull;
  83. __u64 sps_hdrfull;
  84. };
  85. extern struct qlogic_ib_stats qib_stats;
  86. extern const struct pci_error_handlers qib_pci_err_handler;
  87. #define QIB_CHIP_SWVERSION QIB_CHIP_VERS_MAJ
  88. /*
  89. * First-cut critierion for "device is active" is
  90. * two thousand dwords combined Tx, Rx traffic per
  91. * 5-second interval. SMA packets are 64 dwords,
  92. * and occur "a few per second", presumably each way.
  93. */
  94. #define QIB_TRAFFIC_ACTIVE_THRESHOLD (2000)
  95. /*
  96. * Below contains all data related to a single context (formerly called port).
  97. */
  98. #ifdef CONFIG_DEBUG_FS
  99. struct qib_opcode_stats_perctx;
  100. #endif
  101. struct qib_ctxtdata {
  102. void **rcvegrbuf;
  103. dma_addr_t *rcvegrbuf_phys;
  104. /* rcvhdrq base, needs mmap before useful */
  105. void *rcvhdrq;
  106. /* kernel virtual address where hdrqtail is updated */
  107. void *rcvhdrtail_kvaddr;
  108. /*
  109. * temp buffer for expected send setup, allocated at open, instead
  110. * of each setup call
  111. */
  112. void *tid_pg_list;
  113. /*
  114. * Shared page for kernel to signal user processes that send buffers
  115. * need disarming. The process should call QIB_CMD_DISARM_BUFS
  116. * or QIB_CMD_ACK_EVENT with IPATH_EVENT_DISARM_BUFS set.
  117. */
  118. unsigned long *user_event_mask;
  119. /* when waiting for rcv or pioavail */
  120. wait_queue_head_t wait;
  121. /*
  122. * rcvegr bufs base, physical, must fit
  123. * in 44 bits so 32 bit programs mmap64 44 bit works)
  124. */
  125. dma_addr_t rcvegr_phys;
  126. /* mmap of hdrq, must fit in 44 bits */
  127. dma_addr_t rcvhdrq_phys;
  128. dma_addr_t rcvhdrqtailaddr_phys;
  129. /*
  130. * number of opens (including slave sub-contexts) on this instance
  131. * (ignoring forks, dup, etc. for now)
  132. */
  133. int cnt;
  134. /*
  135. * how much space to leave at start of eager TID entries for
  136. * protocol use, on each TID
  137. */
  138. /* instead of calculating it */
  139. unsigned ctxt;
  140. /* local node of context */
  141. int node_id;
  142. /* non-zero if ctxt is being shared. */
  143. u16 subctxt_cnt;
  144. /* non-zero if ctxt is being shared. */
  145. u16 subctxt_id;
  146. /* number of eager TID entries. */
  147. u16 rcvegrcnt;
  148. /* index of first eager TID entry. */
  149. u16 rcvegr_tid_base;
  150. /* number of pio bufs for this ctxt (all procs, if shared) */
  151. u32 piocnt;
  152. /* first pio buffer for this ctxt */
  153. u32 pio_base;
  154. /* chip offset of PIO buffers for this ctxt */
  155. u32 piobufs;
  156. /* how many alloc_pages() chunks in rcvegrbuf_pages */
  157. u32 rcvegrbuf_chunks;
  158. /* how many egrbufs per chunk */
  159. u16 rcvegrbufs_perchunk;
  160. /* ilog2 of above */
  161. u16 rcvegrbufs_perchunk_shift;
  162. /* order for rcvegrbuf_pages */
  163. size_t rcvegrbuf_size;
  164. /* rcvhdrq size (for freeing) */
  165. size_t rcvhdrq_size;
  166. /* per-context flags for fileops/intr communication */
  167. unsigned long flag;
  168. /* next expected TID to check when looking for free */
  169. u32 tidcursor;
  170. /* WAIT_RCV that timed out, no interrupt */
  171. u32 rcvwait_to;
  172. /* WAIT_PIO that timed out, no interrupt */
  173. u32 piowait_to;
  174. /* WAIT_RCV already happened, no wait */
  175. u32 rcvnowait;
  176. /* WAIT_PIO already happened, no wait */
  177. u32 pionowait;
  178. /* total number of polled urgent packets */
  179. u32 urgent;
  180. /* saved total number of polled urgent packets for poll edge trigger */
  181. u32 urgent_poll;
  182. /* pid of process using this ctxt */
  183. pid_t pid;
  184. pid_t subpid[QLOGIC_IB_MAX_SUBCTXT];
  185. /* same size as task_struct .comm[], command that opened context */
  186. char comm[TASK_COMM_LEN];
  187. /* pkeys set by this use of this ctxt */
  188. u16 pkeys[4];
  189. /* so file ops can get at unit */
  190. struct qib_devdata *dd;
  191. /* so funcs that need physical port can get it easily */
  192. struct qib_pportdata *ppd;
  193. /* A page of memory for rcvhdrhead, rcvegrhead, rcvegrtail * N */
  194. void *subctxt_uregbase;
  195. /* An array of pages for the eager receive buffers * N */
  196. void *subctxt_rcvegrbuf;
  197. /* An array of pages for the eager header queue entries * N */
  198. void *subctxt_rcvhdr_base;
  199. /* The version of the library which opened this ctxt */
  200. u32 userversion;
  201. /* Bitmask of active slaves */
  202. u32 active_slaves;
  203. /* Type of packets or conditions we want to poll for */
  204. u16 poll_type;
  205. /* receive packet sequence counter */
  206. u8 seq_cnt;
  207. u8 redirect_seq_cnt;
  208. /* ctxt rcvhdrq head offset */
  209. u32 head;
  210. /* QPs waiting for context processing */
  211. struct list_head qp_wait_list;
  212. #ifdef CONFIG_DEBUG_FS
  213. /* verbs stats per CTX */
  214. struct qib_opcode_stats_perctx *opstats;
  215. #endif
  216. };
  217. struct rvt_sge_state;
  218. struct qib_sdma_txreq {
  219. int flags;
  220. int sg_count;
  221. dma_addr_t addr;
  222. void (*callback)(struct qib_sdma_txreq *, int);
  223. u16 start_idx; /* sdma private */
  224. u16 next_descq_idx; /* sdma private */
  225. struct list_head list; /* sdma private */
  226. };
  227. struct qib_sdma_desc {
  228. __le64 qw[2];
  229. };
  230. struct qib_verbs_txreq {
  231. struct qib_sdma_txreq txreq;
  232. struct rvt_qp *qp;
  233. struct rvt_swqe *wqe;
  234. u32 dwords;
  235. u16 hdr_dwords;
  236. u16 hdr_inx;
  237. struct qib_pio_header *align_buf;
  238. struct rvt_mregion *mr;
  239. struct rvt_sge_state *ss;
  240. };
  241. #define QIB_SDMA_TXREQ_F_USELARGEBUF 0x1
  242. #define QIB_SDMA_TXREQ_F_HEADTOHOST 0x2
  243. #define QIB_SDMA_TXREQ_F_INTREQ 0x4
  244. #define QIB_SDMA_TXREQ_F_FREEBUF 0x8
  245. #define QIB_SDMA_TXREQ_F_FREEDESC 0x10
  246. #define QIB_SDMA_TXREQ_S_OK 0
  247. #define QIB_SDMA_TXREQ_S_SENDERROR 1
  248. #define QIB_SDMA_TXREQ_S_ABORTED 2
  249. #define QIB_SDMA_TXREQ_S_SHUTDOWN 3
  250. /*
  251. * Get/Set IB link-level config parameters for f_get/set_ib_cfg()
  252. * Mostly for MADs that set or query link parameters, also ipath
  253. * config interfaces
  254. */
  255. #define QIB_IB_CFG_LIDLMC 0 /* LID (LS16b) and Mask (MS16b) */
  256. #define QIB_IB_CFG_LWID_ENB 2 /* allowed Link-width */
  257. #define QIB_IB_CFG_LWID 3 /* currently active Link-width */
  258. #define QIB_IB_CFG_SPD_ENB 4 /* allowed Link speeds */
  259. #define QIB_IB_CFG_SPD 5 /* current Link spd */
  260. #define QIB_IB_CFG_RXPOL_ENB 6 /* Auto-RX-polarity enable */
  261. #define QIB_IB_CFG_LREV_ENB 7 /* Auto-Lane-reversal enable */
  262. #define QIB_IB_CFG_LINKLATENCY 8 /* Link Latency (IB1.2 only) */
  263. #define QIB_IB_CFG_HRTBT 9 /* IB heartbeat off/enable/auto; DDR/QDR only */
  264. #define QIB_IB_CFG_OP_VLS 10 /* operational VLs */
  265. #define QIB_IB_CFG_VL_HIGH_CAP 11 /* num of VL high priority weights */
  266. #define QIB_IB_CFG_VL_LOW_CAP 12 /* num of VL low priority weights */
  267. #define QIB_IB_CFG_OVERRUN_THRESH 13 /* IB overrun threshold */
  268. #define QIB_IB_CFG_PHYERR_THRESH 14 /* IB PHY error threshold */
  269. #define QIB_IB_CFG_LINKDEFAULT 15 /* IB link default (sleep/poll) */
  270. #define QIB_IB_CFG_PKEYS 16 /* update partition keys */
  271. #define QIB_IB_CFG_MTU 17 /* update MTU in IBC */
  272. #define QIB_IB_CFG_LSTATE 18 /* update linkcmd and linkinitcmd in IBC */
  273. #define QIB_IB_CFG_VL_HIGH_LIMIT 19
  274. #define QIB_IB_CFG_PMA_TICKS 20 /* PMA sample tick resolution */
  275. #define QIB_IB_CFG_PORT 21 /* switch port we are connected to */
  276. /*
  277. * for CFG_LSTATE: LINKCMD in upper 16 bits, LINKINITCMD in lower 16
  278. * IB_LINKINITCMD_POLL and SLEEP are also used as set/get values for
  279. * QIB_IB_CFG_LINKDEFAULT cmd
  280. */
  281. #define IB_LINKCMD_DOWN (0 << 16)
  282. #define IB_LINKCMD_ARMED (1 << 16)
  283. #define IB_LINKCMD_ACTIVE (2 << 16)
  284. #define IB_LINKINITCMD_NOP 0
  285. #define IB_LINKINITCMD_POLL 1
  286. #define IB_LINKINITCMD_SLEEP 2
  287. #define IB_LINKINITCMD_DISABLE 3
  288. /*
  289. * valid states passed to qib_set_linkstate() user call
  290. */
  291. #define QIB_IB_LINKDOWN 0
  292. #define QIB_IB_LINKARM 1
  293. #define QIB_IB_LINKACTIVE 2
  294. #define QIB_IB_LINKDOWN_ONLY 3
  295. #define QIB_IB_LINKDOWN_SLEEP 4
  296. #define QIB_IB_LINKDOWN_DISABLE 5
  297. /*
  298. * These 7 values (SDR, DDR, and QDR may be ORed for auto-speed
  299. * negotiation) are used for the 3rd argument to path_f_set_ib_cfg
  300. * with cmd QIB_IB_CFG_SPD_ENB, by direct calls or via sysfs. They
  301. * are also the possible values for qib_link_speed_enabled and active
  302. * The values were chosen to match values used within the IB spec.
  303. */
  304. #define QIB_IB_SDR 1
  305. #define QIB_IB_DDR 2
  306. #define QIB_IB_QDR 4
  307. #define QIB_DEFAULT_MTU 4096
  308. /* max number of IB ports supported per HCA */
  309. #define QIB_MAX_IB_PORTS 2
  310. /*
  311. * Possible IB config parameters for f_get/set_ib_table()
  312. */
  313. #define QIB_IB_TBL_VL_HIGH_ARB 1 /* Get/set VL high priority weights */
  314. #define QIB_IB_TBL_VL_LOW_ARB 2 /* Get/set VL low priority weights */
  315. /*
  316. * Possible "operations" for f_rcvctrl(ppd, op, ctxt)
  317. * these are bits so they can be combined, e.g.
  318. * QIB_RCVCTRL_INTRAVAIL_ENB | QIB_RCVCTRL_CTXT_ENB
  319. */
  320. #define QIB_RCVCTRL_TAILUPD_ENB 0x01
  321. #define QIB_RCVCTRL_TAILUPD_DIS 0x02
  322. #define QIB_RCVCTRL_CTXT_ENB 0x04
  323. #define QIB_RCVCTRL_CTXT_DIS 0x08
  324. #define QIB_RCVCTRL_INTRAVAIL_ENB 0x10
  325. #define QIB_RCVCTRL_INTRAVAIL_DIS 0x20
  326. #define QIB_RCVCTRL_PKEY_ENB 0x40 /* Note, default is enabled */
  327. #define QIB_RCVCTRL_PKEY_DIS 0x80
  328. #define QIB_RCVCTRL_BP_ENB 0x0100
  329. #define QIB_RCVCTRL_BP_DIS 0x0200
  330. #define QIB_RCVCTRL_TIDFLOW_ENB 0x0400
  331. #define QIB_RCVCTRL_TIDFLOW_DIS 0x0800
  332. /*
  333. * Possible "operations" for f_sendctrl(ppd, op, var)
  334. * these are bits so they can be combined, e.g.
  335. * QIB_SENDCTRL_BUFAVAIL_ENB | QIB_SENDCTRL_ENB
  336. * Some operations (e.g. DISARM, ABORT) are known to
  337. * be "one-shot", so do not modify shadow.
  338. */
  339. #define QIB_SENDCTRL_DISARM (0x1000)
  340. #define QIB_SENDCTRL_DISARM_BUF(bufn) ((bufn) | QIB_SENDCTRL_DISARM)
  341. /* available (0x2000) */
  342. #define QIB_SENDCTRL_AVAIL_DIS (0x4000)
  343. #define QIB_SENDCTRL_AVAIL_ENB (0x8000)
  344. #define QIB_SENDCTRL_AVAIL_BLIP (0x10000)
  345. #define QIB_SENDCTRL_SEND_DIS (0x20000)
  346. #define QIB_SENDCTRL_SEND_ENB (0x40000)
  347. #define QIB_SENDCTRL_FLUSH (0x80000)
  348. #define QIB_SENDCTRL_CLEAR (0x100000)
  349. #define QIB_SENDCTRL_DISARM_ALL (0x200000)
  350. /*
  351. * These are the generic indices for requesting per-port
  352. * counter values via the f_portcntr function. They
  353. * are always returned as 64 bit values, although most
  354. * are 32 bit counters.
  355. */
  356. /* send-related counters */
  357. #define QIBPORTCNTR_PKTSEND 0U
  358. #define QIBPORTCNTR_WORDSEND 1U
  359. #define QIBPORTCNTR_PSXMITDATA 2U
  360. #define QIBPORTCNTR_PSXMITPKTS 3U
  361. #define QIBPORTCNTR_PSXMITWAIT 4U
  362. #define QIBPORTCNTR_SENDSTALL 5U
  363. /* receive-related counters */
  364. #define QIBPORTCNTR_PKTRCV 6U
  365. #define QIBPORTCNTR_PSRCVDATA 7U
  366. #define QIBPORTCNTR_PSRCVPKTS 8U
  367. #define QIBPORTCNTR_RCVEBP 9U
  368. #define QIBPORTCNTR_RCVOVFL 10U
  369. #define QIBPORTCNTR_WORDRCV 11U
  370. /* IB link related error counters */
  371. #define QIBPORTCNTR_RXLOCALPHYERR 12U
  372. #define QIBPORTCNTR_RXVLERR 13U
  373. #define QIBPORTCNTR_ERRICRC 14U
  374. #define QIBPORTCNTR_ERRVCRC 15U
  375. #define QIBPORTCNTR_ERRLPCRC 16U
  376. #define QIBPORTCNTR_BADFORMAT 17U
  377. #define QIBPORTCNTR_ERR_RLEN 18U
  378. #define QIBPORTCNTR_IBSYMBOLERR 19U
  379. #define QIBPORTCNTR_INVALIDRLEN 20U
  380. #define QIBPORTCNTR_UNSUPVL 21U
  381. #define QIBPORTCNTR_EXCESSBUFOVFL 22U
  382. #define QIBPORTCNTR_ERRLINK 23U
  383. #define QIBPORTCNTR_IBLINKDOWN 24U
  384. #define QIBPORTCNTR_IBLINKERRRECOV 25U
  385. #define QIBPORTCNTR_LLI 26U
  386. /* other error counters */
  387. #define QIBPORTCNTR_RXDROPPKT 27U
  388. #define QIBPORTCNTR_VL15PKTDROP 28U
  389. #define QIBPORTCNTR_ERRPKEY 29U
  390. #define QIBPORTCNTR_KHDROVFL 30U
  391. /* sampling counters (these are actually control registers) */
  392. #define QIBPORTCNTR_PSINTERVAL 31U
  393. #define QIBPORTCNTR_PSSTART 32U
  394. #define QIBPORTCNTR_PSSTAT 33U
  395. /* how often we check for packet activity for "power on hours (in seconds) */
  396. #define ACTIVITY_TIMER 5
  397. #define MAX_NAME_SIZE 64
  398. #ifdef CONFIG_INFINIBAND_QIB_DCA
  399. struct qib_irq_notify;
  400. #endif
  401. struct qib_msix_entry {
  402. void *arg;
  403. #ifdef CONFIG_INFINIBAND_QIB_DCA
  404. int dca;
  405. int rcv;
  406. struct qib_irq_notify *notifier;
  407. #endif
  408. cpumask_var_t mask;
  409. };
  410. /* Below is an opaque struct. Each chip (device) can maintain
  411. * private data needed for its operation, but not germane to the
  412. * rest of the driver. For convenience, we define another that
  413. * is chip-specific, per-port
  414. */
  415. struct qib_chip_specific;
  416. struct qib_chipport_specific;
  417. enum qib_sdma_states {
  418. qib_sdma_state_s00_hw_down,
  419. qib_sdma_state_s10_hw_start_up_wait,
  420. qib_sdma_state_s20_idle,
  421. qib_sdma_state_s30_sw_clean_up_wait,
  422. qib_sdma_state_s40_hw_clean_up_wait,
  423. qib_sdma_state_s50_hw_halt_wait,
  424. qib_sdma_state_s99_running,
  425. };
  426. enum qib_sdma_events {
  427. qib_sdma_event_e00_go_hw_down,
  428. qib_sdma_event_e10_go_hw_start,
  429. qib_sdma_event_e20_hw_started,
  430. qib_sdma_event_e30_go_running,
  431. qib_sdma_event_e40_sw_cleaned,
  432. qib_sdma_event_e50_hw_cleaned,
  433. qib_sdma_event_e60_hw_halted,
  434. qib_sdma_event_e70_go_idle,
  435. qib_sdma_event_e7220_err_halted,
  436. qib_sdma_event_e7322_err_halted,
  437. qib_sdma_event_e90_timer_tick,
  438. };
  439. struct sdma_set_state_action {
  440. unsigned op_enable:1;
  441. unsigned op_intenable:1;
  442. unsigned op_halt:1;
  443. unsigned op_drain:1;
  444. unsigned go_s99_running_tofalse:1;
  445. unsigned go_s99_running_totrue:1;
  446. };
  447. struct qib_sdma_state {
  448. struct kref kref;
  449. struct completion comp;
  450. enum qib_sdma_states current_state;
  451. struct sdma_set_state_action *set_state_action;
  452. unsigned current_op;
  453. unsigned go_s99_running;
  454. unsigned first_sendbuf;
  455. unsigned last_sendbuf; /* really last +1 */
  456. /* debugging/devel */
  457. enum qib_sdma_states previous_state;
  458. unsigned previous_op;
  459. enum qib_sdma_events last_event;
  460. };
  461. struct xmit_wait {
  462. struct timer_list timer;
  463. u64 counter;
  464. u8 flags;
  465. struct cache {
  466. u64 psxmitdata;
  467. u64 psrcvdata;
  468. u64 psxmitpkts;
  469. u64 psrcvpkts;
  470. u64 psxmitwait;
  471. } counter_cache;
  472. };
  473. /*
  474. * The structure below encapsulates data relevant to a physical IB Port.
  475. * Current chips support only one such port, but the separation
  476. * clarifies things a bit. Note that to conform to IB conventions,
  477. * port-numbers are one-based. The first or only port is port1.
  478. */
  479. struct qib_pportdata {
  480. struct qib_ibport ibport_data;
  481. struct qib_devdata *dd;
  482. struct qib_chippport_specific *cpspec; /* chip-specific per-port */
  483. /* GUID for this interface, in network order */
  484. __be64 guid;
  485. /* QIB_POLL, etc. link-state specific flags, per port */
  486. u32 lflags;
  487. /* qib_lflags driver is waiting for */
  488. u32 state_wanted;
  489. spinlock_t lflags_lock;
  490. /* ref count for each pkey */
  491. atomic_t pkeyrefs[4];
  492. /*
  493. * this address is mapped readonly into user processes so they can
  494. * get status cheaply, whenever they want. One qword of status per port
  495. */
  496. u64 *statusp;
  497. /* SendDMA related entries */
  498. /* read mostly */
  499. struct qib_sdma_desc *sdma_descq;
  500. struct workqueue_struct *qib_wq;
  501. struct qib_sdma_state sdma_state;
  502. dma_addr_t sdma_descq_phys;
  503. volatile __le64 *sdma_head_dma; /* DMA'ed by chip */
  504. dma_addr_t sdma_head_phys;
  505. u16 sdma_descq_cnt;
  506. /* read/write using lock */
  507. spinlock_t sdma_lock ____cacheline_aligned_in_smp;
  508. struct list_head sdma_activelist;
  509. struct list_head sdma_userpending;
  510. u64 sdma_descq_added;
  511. u64 sdma_descq_removed;
  512. u16 sdma_descq_tail;
  513. u16 sdma_descq_head;
  514. u8 sdma_generation;
  515. u8 sdma_intrequest;
  516. struct tasklet_struct sdma_sw_clean_up_task
  517. ____cacheline_aligned_in_smp;
  518. wait_queue_head_t state_wait; /* for state_wanted */
  519. /* HoL blocking for SMP replies */
  520. unsigned hol_state;
  521. struct timer_list hol_timer;
  522. /*
  523. * Shadow copies of registers; size indicates read access size.
  524. * Most of them are readonly, but some are write-only register,
  525. * where we manipulate the bits in the shadow copy, and then write
  526. * the shadow copy to qlogic_ib.
  527. *
  528. * We deliberately make most of these 32 bits, since they have
  529. * restricted range. For any that we read, we won't to generate 32
  530. * bit accesses, since Opteron will generate 2 separate 32 bit HT
  531. * transactions for a 64 bit read, and we want to avoid unnecessary
  532. * bus transactions.
  533. */
  534. /* This is the 64 bit group */
  535. /* last ibcstatus. opaque outside chip-specific code */
  536. u64 lastibcstat;
  537. /* these are the "32 bit" regs */
  538. /*
  539. * the following two are 32-bit bitmasks, but {test,clear,set}_bit
  540. * all expect bit fields to be "unsigned long"
  541. */
  542. unsigned long p_rcvctrl; /* shadow per-port rcvctrl */
  543. unsigned long p_sendctrl; /* shadow per-port sendctrl */
  544. u32 ibmtu; /* The MTU programmed for this unit */
  545. /*
  546. * Current max size IB packet (in bytes) including IB headers, that
  547. * we can send. Changes when ibmtu changes.
  548. */
  549. u32 ibmaxlen;
  550. /*
  551. * ibmaxlen at init time, limited by chip and by receive buffer
  552. * size. Not changed after init.
  553. */
  554. u32 init_ibmaxlen;
  555. /* LID programmed for this instance */
  556. u16 lid;
  557. /* list of pkeys programmed; 0 if not set */
  558. u16 pkeys[4];
  559. /* LID mask control */
  560. u8 lmc;
  561. u8 link_width_supported;
  562. u16 link_speed_supported;
  563. u8 link_width_enabled;
  564. u16 link_speed_enabled;
  565. u8 link_width_active;
  566. u16 link_speed_active;
  567. u8 vls_supported;
  568. u8 vls_operational;
  569. /* Rx Polarity inversion (compensate for ~tx on partner) */
  570. u8 rx_pol_inv;
  571. u8 hw_pidx; /* physical port index */
  572. u32 port; /* IB port number and index into dd->pports - 1 */
  573. u8 delay_mult;
  574. /* used to override LED behavior */
  575. u8 led_override; /* Substituted for normal value, if non-zero */
  576. u16 led_override_timeoff; /* delta to next timer event */
  577. u8 led_override_vals[2]; /* Alternates per blink-frame */
  578. u8 led_override_phase; /* Just counts, LSB picks from vals[] */
  579. atomic_t led_override_timer_active;
  580. /* Used to flash LEDs in override mode */
  581. struct timer_list led_override_timer;
  582. struct xmit_wait cong_stats;
  583. struct timer_list symerr_clear_timer;
  584. /* Synchronize access between driver writes and sysfs reads */
  585. spinlock_t cc_shadow_lock
  586. ____cacheline_aligned_in_smp;
  587. /* Shadow copy of the congestion control table */
  588. struct cc_table_shadow *ccti_entries_shadow;
  589. /* Shadow copy of the congestion control entries */
  590. struct ib_cc_congestion_setting_attr_shadow *congestion_entries_shadow;
  591. /* List of congestion control table entries */
  592. struct ib_cc_table_entry_shadow *ccti_entries;
  593. /* 16 congestion entries with each entry corresponding to a SL */
  594. struct ib_cc_congestion_entry_shadow *congestion_entries;
  595. /* Maximum number of congestion control entries that the agent expects
  596. * the manager to send.
  597. */
  598. u16 cc_supported_table_entries;
  599. /* Total number of congestion control table entries */
  600. u16 total_cct_entry;
  601. /* Bit map identifying service level */
  602. u16 cc_sl_control_map;
  603. /* maximum congestion control table index */
  604. u16 ccti_limit;
  605. /* CA's max number of 64 entry units in the congestion control table */
  606. u8 cc_max_table_entries;
  607. };
  608. /* Observers. Not to be taken lightly, possibly not to ship. */
  609. /*
  610. * If a diag read or write is to (bottom <= offset <= top),
  611. * the "hook" is called, allowing, e.g. shadows to be
  612. * updated in sync with the driver. struct diag_observer
  613. * is the "visible" part.
  614. */
  615. struct diag_observer;
  616. typedef int (*diag_hook) (struct qib_devdata *dd,
  617. const struct diag_observer *op,
  618. u32 offs, u64 *data, u64 mask, int only_32);
  619. struct diag_observer {
  620. diag_hook hook;
  621. u32 bottom;
  622. u32 top;
  623. };
  624. extern int qib_register_observer(struct qib_devdata *dd,
  625. const struct diag_observer *op);
  626. /* Only declared here, not defined. Private to diags */
  627. struct diag_observer_list_elt;
  628. /* device data struct now contains only "general per-device" info.
  629. * fields related to a physical IB port are in a qib_pportdata struct,
  630. * described above) while fields only used by a particular chip-type are in
  631. * a qib_chipdata struct, whose contents are opaque to this file.
  632. */
  633. struct qib_devdata {
  634. struct qib_ibdev verbs_dev; /* must be first */
  635. struct list_head list;
  636. /* pointers to related structs for this device */
  637. /* pci access data structure */
  638. struct pci_dev *pcidev;
  639. struct cdev *user_cdev;
  640. struct cdev *diag_cdev;
  641. struct device *user_device;
  642. struct device *diag_device;
  643. /* mem-mapped pointer to base of chip regs */
  644. u64 __iomem *kregbase;
  645. /* end of mem-mapped chip space excluding sendbuf and user regs */
  646. u64 __iomem *kregend;
  647. /* physical address of chip for io_remap, etc. */
  648. resource_size_t physaddr;
  649. /* qib_cfgctxts pointers */
  650. struct qib_ctxtdata **rcd; /* Receive Context Data */
  651. /* qib_pportdata, points to array of (physical) port-specific
  652. * data structs, indexed by pidx (0..n-1)
  653. */
  654. struct qib_pportdata *pport;
  655. struct qib_chip_specific *cspec; /* chip-specific */
  656. /* kvirt address of 1st 2k pio buffer */
  657. void __iomem *pio2kbase;
  658. /* kvirt address of 1st 4k pio buffer */
  659. void __iomem *pio4kbase;
  660. /* mem-mapped pointer to base of PIO buffers (if using WC PAT) */
  661. void __iomem *piobase;
  662. /* mem-mapped pointer to base of user chip regs (if using WC PAT) */
  663. u64 __iomem *userbase;
  664. void __iomem *piovl15base; /* base of VL15 buffers, if not WC */
  665. /*
  666. * points to area where PIOavail registers will be DMA'ed.
  667. * Has to be on a page of it's own, because the page will be
  668. * mapped into user program space. This copy is *ONLY* ever
  669. * written by DMA, not by the driver! Need a copy per device
  670. * when we get to multiple devices
  671. */
  672. volatile __le64 *pioavailregs_dma; /* DMA'ed by chip */
  673. /* physical address where updates occur */
  674. dma_addr_t pioavailregs_phys;
  675. /* device-specific implementations of functions needed by
  676. * common code. Contrary to previous consensus, we can't
  677. * really just point to a device-specific table, because we
  678. * may need to "bend", e.g. *_f_put_tid
  679. */
  680. /* fallback to alternate interrupt type if possible */
  681. int (*f_intr_fallback)(struct qib_devdata *);
  682. /* hard reset chip */
  683. int (*f_reset)(struct qib_devdata *);
  684. void (*f_quiet_serdes)(struct qib_pportdata *);
  685. int (*f_bringup_serdes)(struct qib_pportdata *);
  686. int (*f_early_init)(struct qib_devdata *);
  687. void (*f_clear_tids)(struct qib_devdata *, struct qib_ctxtdata *);
  688. void (*f_put_tid)(struct qib_devdata *, u64 __iomem*,
  689. u32, unsigned long);
  690. void (*f_cleanup)(struct qib_devdata *);
  691. void (*f_setextled)(struct qib_pportdata *, u32);
  692. /* fill out chip-specific fields */
  693. int (*f_get_base_info)(struct qib_ctxtdata *, struct qib_base_info *);
  694. /* free irq */
  695. void (*f_free_irq)(struct qib_devdata *);
  696. struct qib_message_header *(*f_get_msgheader)
  697. (struct qib_devdata *, __le32 *);
  698. void (*f_config_ctxts)(struct qib_devdata *);
  699. int (*f_get_ib_cfg)(struct qib_pportdata *, int);
  700. int (*f_set_ib_cfg)(struct qib_pportdata *, int, u32);
  701. int (*f_set_ib_loopback)(struct qib_pportdata *, const char *);
  702. int (*f_get_ib_table)(struct qib_pportdata *, int, void *);
  703. int (*f_set_ib_table)(struct qib_pportdata *, int, void *);
  704. u32 (*f_iblink_state)(u64);
  705. u8 (*f_ibphys_portstate)(u64);
  706. void (*f_xgxs_reset)(struct qib_pportdata *);
  707. /* per chip actions needed for IB Link up/down changes */
  708. int (*f_ib_updown)(struct qib_pportdata *, int, u64);
  709. u32 __iomem *(*f_getsendbuf)(struct qib_pportdata *, u64, u32 *);
  710. /* Read/modify/write of GPIO pins (potentially chip-specific */
  711. int (*f_gpio_mod)(struct qib_devdata *dd, u32 out, u32 dir,
  712. u32 mask);
  713. /* Enable writes to config EEPROM (if supported) */
  714. int (*f_eeprom_wen)(struct qib_devdata *dd, int wen);
  715. /*
  716. * modify rcvctrl shadow[s] and write to appropriate chip-regs.
  717. * see above QIB_RCVCTRL_xxx_ENB/DIS for operations.
  718. * (ctxt == -1) means "all contexts", only meaningful for
  719. * clearing. Could remove if chip_spec shutdown properly done.
  720. */
  721. void (*f_rcvctrl)(struct qib_pportdata *, unsigned int op,
  722. int ctxt);
  723. /* Read/modify/write sendctrl appropriately for op and port. */
  724. void (*f_sendctrl)(struct qib_pportdata *, u32 op);
  725. void (*f_set_intr_state)(struct qib_devdata *, u32);
  726. void (*f_set_armlaunch)(struct qib_devdata *, u32);
  727. void (*f_wantpiobuf_intr)(struct qib_devdata *, u32);
  728. int (*f_late_initreg)(struct qib_devdata *);
  729. int (*f_init_sdma_regs)(struct qib_pportdata *);
  730. u16 (*f_sdma_gethead)(struct qib_pportdata *);
  731. int (*f_sdma_busy)(struct qib_pportdata *);
  732. void (*f_sdma_update_tail)(struct qib_pportdata *, u16);
  733. void (*f_sdma_set_desc_cnt)(struct qib_pportdata *, unsigned);
  734. void (*f_sdma_sendctrl)(struct qib_pportdata *, unsigned);
  735. void (*f_sdma_hw_clean_up)(struct qib_pportdata *);
  736. void (*f_sdma_hw_start_up)(struct qib_pportdata *);
  737. void (*f_sdma_init_early)(struct qib_pportdata *);
  738. void (*f_set_cntr_sample)(struct qib_pportdata *, u32, u32);
  739. void (*f_update_usrhead)(struct qib_ctxtdata *, u64, u32, u32, u32);
  740. u32 (*f_hdrqempty)(struct qib_ctxtdata *);
  741. u64 (*f_portcntr)(struct qib_pportdata *, u32);
  742. u32 (*f_read_cntrs)(struct qib_devdata *, loff_t, char **,
  743. u64 **);
  744. u32 (*f_read_portcntrs)(struct qib_devdata *, loff_t, u32,
  745. char **, u64 **);
  746. u32 (*f_setpbc_control)(struct qib_pportdata *, u32, u8, u8);
  747. void (*f_initvl15_bufs)(struct qib_devdata *);
  748. void (*f_init_ctxt)(struct qib_ctxtdata *);
  749. void (*f_txchk_change)(struct qib_devdata *, u32, u32, u32,
  750. struct qib_ctxtdata *);
  751. void (*f_writescratch)(struct qib_devdata *, u32);
  752. int (*f_tempsense_rd)(struct qib_devdata *, int regnum);
  753. #ifdef CONFIG_INFINIBAND_QIB_DCA
  754. int (*f_notify_dca)(struct qib_devdata *, unsigned long event);
  755. #endif
  756. char *boardname; /* human readable board info */
  757. /* template for writing TIDs */
  758. u64 tidtemplate;
  759. /* value to write to free TIDs */
  760. u64 tidinvalid;
  761. /* number of registers used for pioavail */
  762. u32 pioavregs;
  763. /* device (not port) flags, basically device capabilities */
  764. u32 flags;
  765. /* last buffer for user use */
  766. u32 lastctxt_piobuf;
  767. /* reset value */
  768. u64 z_int_counter;
  769. /* percpu intcounter */
  770. u64 __percpu *int_counter;
  771. /* pio bufs allocated per ctxt */
  772. u32 pbufsctxt;
  773. /* if remainder on bufs/ctxt, ctxts < extrabuf get 1 extra */
  774. u32 ctxts_extrabuf;
  775. /*
  776. * number of ctxts configured as max; zero is set to number chip
  777. * supports, less gives more pio bufs/ctxt, etc.
  778. */
  779. u32 cfgctxts;
  780. /*
  781. * number of ctxts available for PSM open
  782. */
  783. u32 freectxts;
  784. /*
  785. * hint that we should update pioavailshadow before
  786. * looking for a PIO buffer
  787. */
  788. u32 upd_pio_shadow;
  789. /* internal debugging stats */
  790. u32 maxpkts_call;
  791. u32 avgpkts_call;
  792. u64 nopiobufs;
  793. /* PCI Vendor ID (here for NodeInfo) */
  794. u16 vendorid;
  795. /* PCI Device ID (here for NodeInfo) */
  796. u16 deviceid;
  797. /* for write combining settings */
  798. int wc_cookie;
  799. unsigned long wc_base;
  800. unsigned long wc_len;
  801. /* shadow copy of struct page *'s for exp tid pages */
  802. struct page **pageshadow;
  803. /* shadow copy of dma handles for exp tid pages */
  804. dma_addr_t *physshadow;
  805. u64 __iomem *egrtidbase;
  806. spinlock_t sendctrl_lock; /* protect changes to sendctrl shadow */
  807. /* around rcd and (user ctxts) ctxt_cnt use (intr vs free) */
  808. spinlock_t uctxt_lock; /* rcd and user context changes */
  809. /*
  810. * per unit status, see also portdata statusp
  811. * mapped readonly into user processes so they can get unit and
  812. * IB link status cheaply
  813. */
  814. u64 *devstatusp;
  815. char *freezemsg; /* freeze msg if hw error put chip in freeze */
  816. u32 freezelen; /* max length of freezemsg */
  817. /* timer used to prevent stats overflow, error throttling, etc. */
  818. struct timer_list stats_timer;
  819. /* timer to verify interrupts work, and fallback if possible */
  820. struct timer_list intrchk_timer;
  821. unsigned long ureg_align; /* user register alignment */
  822. /*
  823. * Protects pioavailshadow, pioavailkernel, pio_need_disarm, and
  824. * pio_writing.
  825. */
  826. spinlock_t pioavail_lock;
  827. /*
  828. * index of last buffer to optimize search for next
  829. */
  830. u32 last_pio;
  831. /*
  832. * min kernel pio buffer to optimize search
  833. */
  834. u32 min_kernel_pio;
  835. /*
  836. * Shadow copies of registers; size indicates read access size.
  837. * Most of them are readonly, but some are write-only register,
  838. * where we manipulate the bits in the shadow copy, and then write
  839. * the shadow copy to qlogic_ib.
  840. *
  841. * We deliberately make most of these 32 bits, since they have
  842. * restricted range. For any that we read, we won't to generate 32
  843. * bit accesses, since Opteron will generate 2 separate 32 bit HT
  844. * transactions for a 64 bit read, and we want to avoid unnecessary
  845. * bus transactions.
  846. */
  847. /* This is the 64 bit group */
  848. unsigned long pioavailshadow[6];
  849. /* bitmap of send buffers available for the kernel to use with PIO. */
  850. unsigned long pioavailkernel[6];
  851. /* bitmap of send buffers which need to be disarmed. */
  852. unsigned long pio_need_disarm[3];
  853. /* bitmap of send buffers which are being written to. */
  854. unsigned long pio_writing[3];
  855. /* kr_revision shadow */
  856. u64 revision;
  857. /* Base GUID for device (from eeprom, network order) */
  858. __be64 base_guid;
  859. /*
  860. * kr_sendpiobufbase value (chip offset of pio buffers), and the
  861. * base of the 2KB buffer s(user processes only use 2K)
  862. */
  863. u64 piobufbase;
  864. u32 pio2k_bufbase;
  865. /* these are the "32 bit" regs */
  866. /* number of GUIDs in the flash for this interface */
  867. u32 nguid;
  868. /*
  869. * the following two are 32-bit bitmasks, but {test,clear,set}_bit
  870. * all expect bit fields to be "unsigned long"
  871. */
  872. unsigned long rcvctrl; /* shadow per device rcvctrl */
  873. unsigned long sendctrl; /* shadow per device sendctrl */
  874. /* value we put in kr_rcvhdrcnt */
  875. u32 rcvhdrcnt;
  876. /* value we put in kr_rcvhdrsize */
  877. u32 rcvhdrsize;
  878. /* value we put in kr_rcvhdrentsize */
  879. u32 rcvhdrentsize;
  880. /* kr_ctxtcnt value */
  881. u32 ctxtcnt;
  882. /* kr_pagealign value */
  883. u32 palign;
  884. /* number of "2KB" PIO buffers */
  885. u32 piobcnt2k;
  886. /* size in bytes of "2KB" PIO buffers */
  887. u32 piosize2k;
  888. /* max usable size in dwords of a "2KB" PIO buffer before going "4KB" */
  889. u32 piosize2kmax_dwords;
  890. /* number of "4KB" PIO buffers */
  891. u32 piobcnt4k;
  892. /* size in bytes of "4KB" PIO buffers */
  893. u32 piosize4k;
  894. /* kr_rcvegrbase value */
  895. u32 rcvegrbase;
  896. /* kr_rcvtidbase value */
  897. u32 rcvtidbase;
  898. /* kr_rcvtidcnt value */
  899. u32 rcvtidcnt;
  900. /* kr_userregbase */
  901. u32 uregbase;
  902. /* shadow the control register contents */
  903. u32 control;
  904. /* chip address space used by 4k pio buffers */
  905. u32 align4k;
  906. /* size of each rcvegrbuffer */
  907. u16 rcvegrbufsize;
  908. /* log2 of above */
  909. u16 rcvegrbufsize_shift;
  910. /* localbus width (1, 2,4,8,16,32) from config space */
  911. u32 lbus_width;
  912. /* localbus speed in MHz */
  913. u32 lbus_speed;
  914. int unit; /* unit # of this chip */
  915. /* start of CHIP_SPEC move to chipspec, but need code changes */
  916. /* low and high portions of MSI capability/vector */
  917. u32 msi_lo;
  918. /* saved after PCIe init for restore after reset */
  919. u32 msi_hi;
  920. /* MSI data (vector) saved for restore */
  921. u16 msi_data;
  922. /* so we can rewrite it after a chip reset */
  923. u32 pcibar0;
  924. /* so we can rewrite it after a chip reset */
  925. u32 pcibar1;
  926. u64 rhdrhead_intr_off;
  927. /*
  928. * ASCII serial number, from flash, large enough for original
  929. * all digit strings, and longer QLogic serial number format
  930. */
  931. u8 serial[16];
  932. /* human readable board version */
  933. u8 boardversion[96];
  934. u8 lbus_info[32]; /* human readable localbus info */
  935. /* chip major rev, from qib_revision */
  936. u8 majrev;
  937. /* chip minor rev, from qib_revision */
  938. u8 minrev;
  939. /* Misc small ints */
  940. /* Number of physical ports available */
  941. u8 num_pports;
  942. /* Lowest context number which can be used by user processes */
  943. u8 first_user_ctxt;
  944. u8 n_krcv_queues;
  945. u8 qpn_mask;
  946. u8 skip_kctxt_mask;
  947. u16 rhf_offset; /* offset of RHF within receive header entry */
  948. /*
  949. * GPIO pins for twsi-connected devices, and device code for eeprom
  950. */
  951. u8 gpio_sda_num;
  952. u8 gpio_scl_num;
  953. u8 twsi_eeprom_dev;
  954. u8 board_atten;
  955. /* Support (including locks) for EEPROM logging of errors and time */
  956. /* control access to actual counters, timer */
  957. spinlock_t eep_st_lock;
  958. /* control high-level access to EEPROM */
  959. struct mutex eep_lock;
  960. uint64_t traffic_wds;
  961. struct qib_diag_client *diag_client;
  962. spinlock_t qib_diag_trans_lock; /* protect diag observer ops */
  963. struct diag_observer_list_elt *diag_observer_list;
  964. u8 psxmitwait_supported;
  965. /* cycle length of PS* counters in HW (in picoseconds) */
  966. u16 psxmitwait_check_rate;
  967. /* high volume overflow errors defered to tasklet */
  968. struct tasklet_struct error_tasklet;
  969. int assigned_node_id; /* NUMA node closest to HCA */
  970. };
  971. /* hol_state values */
  972. #define QIB_HOL_UP 0
  973. #define QIB_HOL_INIT 1
  974. #define QIB_SDMA_SENDCTRL_OP_ENABLE (1U << 0)
  975. #define QIB_SDMA_SENDCTRL_OP_INTENABLE (1U << 1)
  976. #define QIB_SDMA_SENDCTRL_OP_HALT (1U << 2)
  977. #define QIB_SDMA_SENDCTRL_OP_CLEANUP (1U << 3)
  978. #define QIB_SDMA_SENDCTRL_OP_DRAIN (1U << 4)
  979. /* operation types for f_txchk_change() */
  980. #define TXCHK_CHG_TYPE_DIS1 3
  981. #define TXCHK_CHG_TYPE_ENAB1 2
  982. #define TXCHK_CHG_TYPE_KERN 1
  983. #define TXCHK_CHG_TYPE_USER 0
  984. #define QIB_CHASE_TIME msecs_to_jiffies(145)
  985. #define QIB_CHASE_DIS_TIME msecs_to_jiffies(160)
  986. /* Private data for file operations */
  987. struct qib_filedata {
  988. struct qib_ctxtdata *rcd;
  989. unsigned subctxt;
  990. unsigned tidcursor;
  991. struct qib_user_sdma_queue *pq;
  992. int rec_cpu_num; /* for cpu affinity; -1 if none */
  993. };
  994. extern struct xarray qib_dev_table;
  995. extern struct qib_devdata *qib_lookup(int unit);
  996. extern u32 qib_cpulist_count;
  997. extern unsigned long *qib_cpulist;
  998. extern unsigned qib_cc_table_size;
  999. int qib_init(struct qib_devdata *, int);
  1000. int init_chip_wc_pat(struct qib_devdata *dd, u32);
  1001. int qib_enable_wc(struct qib_devdata *dd);
  1002. void qib_disable_wc(struct qib_devdata *dd);
  1003. int qib_count_units(int *npresentp, int *nupp);
  1004. int qib_count_active_units(void);
  1005. int qib_cdev_init(int minor, const char *name,
  1006. const struct file_operations *fops,
  1007. struct cdev **cdevp, struct device **devp);
  1008. void qib_cdev_cleanup(struct cdev **cdevp, struct device **devp);
  1009. int qib_dev_init(void);
  1010. void qib_dev_cleanup(void);
  1011. int qib_diag_add(struct qib_devdata *);
  1012. void qib_diag_remove(struct qib_devdata *);
  1013. void qib_handle_e_ibstatuschanged(struct qib_pportdata *, u64);
  1014. void qib_sdma_update_tail(struct qib_pportdata *, u16); /* hold sdma_lock */
  1015. int qib_decode_err(struct qib_devdata *dd, char *buf, size_t blen, u64 err);
  1016. void qib_bad_intrstatus(struct qib_devdata *);
  1017. void qib_handle_urcv(struct qib_devdata *, u64);
  1018. /* clean up any per-chip chip-specific stuff */
  1019. void qib_chip_cleanup(struct qib_devdata *);
  1020. /* clean up any chip type-specific stuff */
  1021. void qib_chip_done(void);
  1022. /* check to see if we have to force ordering for write combining */
  1023. int qib_unordered_wc(void);
  1024. void qib_pio_copy(void __iomem *to, const void *from, size_t count);
  1025. void qib_disarm_piobufs(struct qib_devdata *, unsigned, unsigned);
  1026. int qib_disarm_piobufs_ifneeded(struct qib_ctxtdata *);
  1027. void qib_disarm_piobufs_set(struct qib_devdata *, unsigned long *, unsigned);
  1028. void qib_cancel_sends(struct qib_pportdata *);
  1029. int qib_create_rcvhdrq(struct qib_devdata *, struct qib_ctxtdata *);
  1030. int qib_setup_eagerbufs(struct qib_ctxtdata *);
  1031. void qib_set_ctxtcnt(struct qib_devdata *);
  1032. int qib_create_ctxts(struct qib_devdata *dd);
  1033. struct qib_ctxtdata *qib_create_ctxtdata(struct qib_pportdata *, u32, int);
  1034. int qib_init_pportdata(struct qib_pportdata *, struct qib_devdata *, u8, u8);
  1035. void qib_free_ctxtdata(struct qib_devdata *, struct qib_ctxtdata *);
  1036. u32 qib_kreceive(struct qib_ctxtdata *, u32 *, u32 *);
  1037. int qib_reset_device(int);
  1038. int qib_wait_linkstate(struct qib_pportdata *, u32, int);
  1039. int qib_set_linkstate(struct qib_pportdata *, u8);
  1040. int qib_set_mtu(struct qib_pportdata *, u16);
  1041. int qib_set_lid(struct qib_pportdata *, u32, u8);
  1042. void qib_hol_down(struct qib_pportdata *);
  1043. void qib_hol_init(struct qib_pportdata *);
  1044. void qib_hol_up(struct qib_pportdata *);
  1045. void qib_hol_event(struct timer_list *);
  1046. void qib_disable_after_error(struct qib_devdata *);
  1047. int qib_set_uevent_bits(struct qib_pportdata *, const int);
  1048. /* for use in system calls, where we want to know device type, etc. */
  1049. #define ctxt_fp(fp) \
  1050. (((struct qib_filedata *)(fp)->private_data)->rcd)
  1051. #define subctxt_fp(fp) \
  1052. (((struct qib_filedata *)(fp)->private_data)->subctxt)
  1053. #define tidcursor_fp(fp) \
  1054. (((struct qib_filedata *)(fp)->private_data)->tidcursor)
  1055. #define user_sdma_queue_fp(fp) \
  1056. (((struct qib_filedata *)(fp)->private_data)->pq)
  1057. static inline struct qib_devdata *dd_from_ppd(struct qib_pportdata *ppd)
  1058. {
  1059. return ppd->dd;
  1060. }
  1061. static inline struct qib_devdata *dd_from_dev(struct qib_ibdev *dev)
  1062. {
  1063. return container_of(dev, struct qib_devdata, verbs_dev);
  1064. }
  1065. static inline struct qib_devdata *dd_from_ibdev(struct ib_device *ibdev)
  1066. {
  1067. return dd_from_dev(to_idev(ibdev));
  1068. }
  1069. static inline struct qib_pportdata *ppd_from_ibp(struct qib_ibport *ibp)
  1070. {
  1071. return container_of(ibp, struct qib_pportdata, ibport_data);
  1072. }
  1073. static inline struct qib_ibport *to_iport(struct ib_device *ibdev, u32 port)
  1074. {
  1075. struct qib_devdata *dd = dd_from_ibdev(ibdev);
  1076. u32 pidx = port - 1; /* IB number port from 1, hdw from 0 */
  1077. WARN_ON(pidx >= dd->num_pports);
  1078. return &dd->pport[pidx].ibport_data;
  1079. }
  1080. /*
  1081. * values for dd->flags (_device_ related flags) and
  1082. */
  1083. #define QIB_HAS_LINK_LATENCY 0x1 /* supports link latency (IB 1.2) */
  1084. #define QIB_INITTED 0x2 /* chip and driver up and initted */
  1085. #define QIB_DOING_RESET 0x4 /* in the middle of doing chip reset */
  1086. #define QIB_PRESENT 0x8 /* chip accesses can be done */
  1087. #define QIB_PIO_FLUSH_WC 0x10 /* Needs Write combining flush for PIO */
  1088. #define QIB_HAS_THRESH_UPDATE 0x40
  1089. #define QIB_HAS_SDMA_TIMEOUT 0x80
  1090. #define QIB_USE_SPCL_TRIG 0x100 /* SpecialTrigger launch enabled */
  1091. #define QIB_NODMA_RTAIL 0x200 /* rcvhdrtail register DMA enabled */
  1092. #define QIB_HAS_INTX 0x800 /* Supports INTx interrupts */
  1093. #define QIB_HAS_SEND_DMA 0x1000 /* Supports Send DMA */
  1094. #define QIB_HAS_VLSUPP 0x2000 /* Supports multiple VLs; PBC different */
  1095. #define QIB_HAS_HDRSUPP 0x4000 /* Supports header suppression */
  1096. #define QIB_BADINTR 0x8000 /* severe interrupt problems */
  1097. #define QIB_DCA_ENABLED 0x10000 /* Direct Cache Access enabled */
  1098. #define QIB_HAS_QSFP 0x20000 /* device (card instance) has QSFP */
  1099. #define QIB_SHUTDOWN 0x40000 /* device is shutting down */
  1100. /*
  1101. * values for ppd->lflags (_ib_port_ related flags)
  1102. */
  1103. #define QIBL_LINKV 0x1 /* IB link state valid */
  1104. #define QIBL_LINKDOWN 0x8 /* IB link is down */
  1105. #define QIBL_LINKINIT 0x10 /* IB link level is up */
  1106. #define QIBL_LINKARMED 0x20 /* IB link is ARMED */
  1107. #define QIBL_LINKACTIVE 0x40 /* IB link is ACTIVE */
  1108. /* leave a gap for more IB-link state */
  1109. #define QIBL_IB_AUTONEG_INPROG 0x1000 /* non-IBTA DDR/QDR neg active */
  1110. #define QIBL_IB_AUTONEG_FAILED 0x2000 /* non-IBTA DDR/QDR neg failed */
  1111. #define QIBL_IB_LINK_DISABLED 0x4000 /* Linkdown-disable forced,
  1112. * Do not try to bring up */
  1113. #define QIBL_IB_FORCE_NOTIFY 0x8000 /* force notify on next ib change */
  1114. /* IB dword length mask in PBC (lower 11 bits); same for all chips */
  1115. #define QIB_PBC_LENGTH_MASK ((1 << 11) - 1)
  1116. /* ctxt_flag bit offsets */
  1117. /* waiting for a packet to arrive */
  1118. #define QIB_CTXT_WAITING_RCV 2
  1119. /* master has not finished initializing */
  1120. #define QIB_CTXT_MASTER_UNINIT 4
  1121. /* waiting for an urgent packet to arrive */
  1122. #define QIB_CTXT_WAITING_URG 5
  1123. /* free up any allocated data at closes */
  1124. void qib_free_data(struct qib_ctxtdata *dd);
  1125. void qib_chg_pioavailkernel(struct qib_devdata *, unsigned, unsigned,
  1126. u32, struct qib_ctxtdata *);
  1127. struct qib_devdata *qib_init_iba7322_funcs(struct pci_dev *,
  1128. const struct pci_device_id *);
  1129. struct qib_devdata *qib_init_iba7220_funcs(struct pci_dev *,
  1130. const struct pci_device_id *);
  1131. struct qib_devdata *qib_init_iba6120_funcs(struct pci_dev *,
  1132. const struct pci_device_id *);
  1133. void qib_free_devdata(struct qib_devdata *);
  1134. struct qib_devdata *qib_alloc_devdata(struct pci_dev *pdev, size_t extra);
  1135. #define QIB_TWSI_NO_DEV 0xFF
  1136. /* Below qib_twsi_ functions must be called with eep_lock held */
  1137. int qib_twsi_reset(struct qib_devdata *dd);
  1138. int qib_twsi_blk_rd(struct qib_devdata *dd, int dev, int addr, void *buffer,
  1139. int len);
  1140. int qib_twsi_blk_wr(struct qib_devdata *dd, int dev, int addr,
  1141. const void *buffer, int len);
  1142. void qib_get_eeprom_info(struct qib_devdata *);
  1143. void qib_dump_lookup_output_queue(struct qib_devdata *);
  1144. void qib_force_pio_avail_update(struct qib_devdata *);
  1145. void qib_clear_symerror_on_linkup(struct timer_list *t);
  1146. /*
  1147. * Set LED override, only the two LSBs have "public" meaning, but
  1148. * any non-zero value substitutes them for the Link and LinkTrain
  1149. * LED states.
  1150. */
  1151. #define QIB_LED_PHYS 1 /* Physical (linktraining) GREEN LED */
  1152. #define QIB_LED_LOG 2 /* Logical (link) YELLOW LED */
  1153. void qib_set_led_override(struct qib_pportdata *ppd, unsigned int val);
  1154. /* send dma routines */
  1155. int qib_setup_sdma(struct qib_pportdata *);
  1156. void qib_teardown_sdma(struct qib_pportdata *);
  1157. void __qib_sdma_intr(struct qib_pportdata *);
  1158. void qib_sdma_intr(struct qib_pportdata *);
  1159. void qib_user_sdma_send_desc(struct qib_pportdata *dd,
  1160. struct list_head *pktlist);
  1161. int qib_sdma_verbs_send(struct qib_pportdata *, struct rvt_sge_state *,
  1162. u32, struct qib_verbs_txreq *);
  1163. /* ppd->sdma_lock should be locked before calling this. */
  1164. int qib_sdma_make_progress(struct qib_pportdata *dd);
  1165. /* must be called under qib_sdma_lock */
  1166. static inline u16 qib_sdma_descq_freecnt(const struct qib_pportdata *ppd)
  1167. {
  1168. return ppd->sdma_descq_cnt -
  1169. (ppd->sdma_descq_added - ppd->sdma_descq_removed) - 1;
  1170. }
  1171. static inline int __qib_sdma_running(struct qib_pportdata *ppd)
  1172. {
  1173. return ppd->sdma_state.current_state == qib_sdma_state_s99_running;
  1174. }
  1175. int qib_sdma_running(struct qib_pportdata *);
  1176. void dump_sdma_state(struct qib_pportdata *ppd);
  1177. void __qib_sdma_process_event(struct qib_pportdata *, enum qib_sdma_events);
  1178. void qib_sdma_process_event(struct qib_pportdata *, enum qib_sdma_events);
  1179. /*
  1180. * number of words used for protocol header if not set by qib_userinit();
  1181. */
  1182. #define QIB_DFLT_RCVHDRSIZE 9
  1183. /*
  1184. * We need to be able to handle an IB header of at least 24 dwords.
  1185. * We need the rcvhdrq large enough to handle largest IB header, but
  1186. * still have room for a 2KB MTU standard IB packet.
  1187. * Additionally, some processor/memory controller combinations
  1188. * benefit quite strongly from having the DMA'ed data be cacheline
  1189. * aligned and a cacheline multiple, so we set the size to 32 dwords
  1190. * (2 64-byte primary cachelines for pretty much all processors of
  1191. * interest). The alignment hurts nothing, other than using somewhat
  1192. * more memory.
  1193. */
  1194. #define QIB_RCVHDR_ENTSIZE 32
  1195. int qib_get_user_pages(unsigned long, size_t, struct page **);
  1196. void qib_release_user_pages(struct page **, size_t);
  1197. int qib_eeprom_read(struct qib_devdata *, u8, void *, int);
  1198. int qib_eeprom_write(struct qib_devdata *, u8, const void *, int);
  1199. u32 __iomem *qib_getsendbuf_range(struct qib_devdata *, u32 *, u32, u32);
  1200. void qib_sendbuf_done(struct qib_devdata *, unsigned);
  1201. static inline void qib_clear_rcvhdrtail(const struct qib_ctxtdata *rcd)
  1202. {
  1203. *((u64 *) rcd->rcvhdrtail_kvaddr) = 0ULL;
  1204. }
  1205. static inline u32 qib_get_rcvhdrtail(const struct qib_ctxtdata *rcd)
  1206. {
  1207. /*
  1208. * volatile because it's a DMA target from the chip, routine is
  1209. * inlined, and don't want register caching or reordering.
  1210. */
  1211. return (u32) le64_to_cpu(
  1212. *((volatile __le64 *)rcd->rcvhdrtail_kvaddr)); /* DMA'ed */
  1213. }
  1214. /*
  1215. * sysfs interface.
  1216. */
  1217. extern const char ib_qib_version[];
  1218. extern const struct attribute_group qib_attr_group;
  1219. extern const struct attribute_group *qib_attr_port_groups[];
  1220. int qib_device_create(struct qib_devdata *);
  1221. void qib_device_remove(struct qib_devdata *);
  1222. /* Hook for sysfs read of QSFP */
  1223. extern int qib_qsfp_dump(struct qib_pportdata *ppd, char *buf, int len);
  1224. int __init qib_init_qibfs(void);
  1225. int __exit qib_exit_qibfs(void);
  1226. int qibfs_add(struct qib_devdata *);
  1227. int qibfs_remove(struct qib_devdata *);
  1228. int qib_pcie_init(struct pci_dev *, const struct pci_device_id *);
  1229. int qib_pcie_ddinit(struct qib_devdata *, struct pci_dev *,
  1230. const struct pci_device_id *);
  1231. void qib_pcie_ddcleanup(struct qib_devdata *);
  1232. int qib_pcie_params(struct qib_devdata *dd, u32 minw, u32 *nent);
  1233. void qib_free_irq(struct qib_devdata *dd);
  1234. int qib_reinit_intr(struct qib_devdata *dd);
  1235. void qib_pcie_getcmd(struct qib_devdata *, u16 *, u8 *, u8 *);
  1236. void qib_pcie_reenable(struct qib_devdata *, u16, u8, u8);
  1237. /* interrupts for device */
  1238. u64 qib_int_counter(struct qib_devdata *);
  1239. /* interrupt for all devices */
  1240. u64 qib_sps_ints(void);
  1241. /*
  1242. * dma_addr wrappers - all 0's invalid for hw
  1243. */
  1244. int qib_map_page(struct pci_dev *d, struct page *p, dma_addr_t *daddr);
  1245. struct pci_dev *qib_get_pci_dev(struct rvt_dev_info *rdi);
  1246. /*
  1247. * Flush write combining store buffers (if present) and perform a write
  1248. * barrier.
  1249. */
  1250. static inline void qib_flush_wc(void)
  1251. {
  1252. #if defined(CONFIG_X86_64)
  1253. asm volatile("sfence" : : : "memory");
  1254. #else
  1255. wmb(); /* no reorder around wc flush */
  1256. #endif
  1257. }
  1258. /* global module parameter variables */
  1259. extern unsigned qib_ibmtu;
  1260. extern ushort qib_cfgctxts;
  1261. extern ushort qib_num_cfg_vls;
  1262. extern ushort qib_mini_init; /* If set, do few (ideally 0) writes to chip */
  1263. extern unsigned qib_n_krcv_queues;
  1264. extern unsigned qib_sdma_fetch_arb;
  1265. extern unsigned qib_compat_ddr_negotiate;
  1266. extern int qib_special_trigger;
  1267. extern unsigned qib_numa_aware;
  1268. extern struct mutex qib_mutex;
  1269. /* Number of seconds before our card status check... */
  1270. #define STATUS_TIMEOUT 60
  1271. #define QIB_DRV_NAME "ib_qib"
  1272. #define QIB_USER_MINOR_BASE 0
  1273. #define QIB_TRACE_MINOR 127
  1274. #define QIB_DIAGPKT_MINOR 128
  1275. #define QIB_DIAG_MINOR_BASE 129
  1276. #define QIB_NMINORS 255
  1277. #define PCI_VENDOR_ID_PATHSCALE 0x1fc1
  1278. #define PCI_VENDOR_ID_QLOGIC 0x1077
  1279. #define PCI_DEVICE_ID_QLOGIC_IB_6120 0x10
  1280. #define PCI_DEVICE_ID_QLOGIC_IB_7220 0x7220
  1281. #define PCI_DEVICE_ID_QLOGIC_IB_7322 0x7322
  1282. /*
  1283. * qib_early_err is used (only!) to print early errors before devdata is
  1284. * allocated, or when dd->pcidev may not be valid, and at the tail end of
  1285. * cleanup when devdata may have been freed, etc. qib_dev_porterr is
  1286. * the same as qib_dev_err, but is used when the message really needs
  1287. * the IB port# to be definitive as to what's happening..
  1288. * All of these go to the trace log, and the trace log entry is done
  1289. * first to avoid possible serial port delays from printk.
  1290. */
  1291. #define qib_early_err(dev, fmt, ...) \
  1292. dev_err(dev, fmt, ##__VA_ARGS__)
  1293. #define qib_dev_err(dd, fmt, ...) \
  1294. dev_err(&(dd)->pcidev->dev, "%s: " fmt, \
  1295. rvt_get_ibdev_name(&(dd)->verbs_dev.rdi), ##__VA_ARGS__)
  1296. #define qib_dev_warn(dd, fmt, ...) \
  1297. dev_warn(&(dd)->pcidev->dev, "%s: " fmt, \
  1298. rvt_get_ibdev_name(&(dd)->verbs_dev.rdi), ##__VA_ARGS__)
  1299. #define qib_dev_porterr(dd, port, fmt, ...) \
  1300. dev_err(&(dd)->pcidev->dev, "%s: IB%u:%u " fmt, \
  1301. rvt_get_ibdev_name(&(dd)->verbs_dev.rdi), (dd)->unit, (port), \
  1302. ##__VA_ARGS__)
  1303. #define qib_devinfo(pcidev, fmt, ...) \
  1304. dev_info(&(pcidev)->dev, fmt, ##__VA_ARGS__)
  1305. /*
  1306. * this is used for formatting hw error messages...
  1307. */
  1308. struct qib_hwerror_msgs {
  1309. u64 mask;
  1310. const char *msg;
  1311. size_t sz;
  1312. };
  1313. #define QLOGIC_IB_HWE_MSG(a, b) { .mask = a, .msg = b }
  1314. /* in qib_intr.c... */
  1315. void qib_format_hwerrors(u64 hwerrs,
  1316. const struct qib_hwerror_msgs *hwerrmsgs,
  1317. size_t nhwerrmsgs, char *msg, size_t lmsg);
  1318. void qib_stop_send_queue(struct rvt_qp *qp);
  1319. void qib_quiesce_qp(struct rvt_qp *qp);
  1320. void qib_flush_qp_waiters(struct rvt_qp *qp);
  1321. int qib_mtu_to_path_mtu(u32 mtu);
  1322. u32 qib_mtu_from_qp(struct rvt_dev_info *rdi, struct rvt_qp *qp, u32 pmtu);
  1323. void qib_notify_error_qp(struct rvt_qp *qp);
  1324. int qib_get_pmtu_from_attr(struct rvt_dev_info *rdi, struct rvt_qp *qp,
  1325. struct ib_qp_attr *attr);
  1326. #endif /* _QIB_KERNEL_H */