apple-dart.c 28 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Apple DART (Device Address Resolution Table) IOMMU driver
  4. *
  5. * Copyright (C) 2021 The Asahi Linux Contributors
  6. *
  7. * Based on arm/arm-smmu/arm-smmu.c and arm/arm-smmu-v3/arm-smmu-v3.c
  8. * Copyright (C) 2013 ARM Limited
  9. * Copyright (C) 2015 ARM Limited
  10. * and on exynos-iommu.c
  11. * Copyright (c) 2011,2016 Samsung Electronics Co., Ltd.
  12. */
  13. #include <linux/atomic.h>
  14. #include <linux/bitfield.h>
  15. #include <linux/clk.h>
  16. #include <linux/dev_printk.h>
  17. #include <linux/dma-mapping.h>
  18. #include <linux/err.h>
  19. #include <linux/interrupt.h>
  20. #include <linux/io-pgtable.h>
  21. #include <linux/iommu.h>
  22. #include <linux/iopoll.h>
  23. #include <linux/module.h>
  24. #include <linux/of.h>
  25. #include <linux/of_address.h>
  26. #include <linux/of_iommu.h>
  27. #include <linux/of_platform.h>
  28. #include <linux/pci.h>
  29. #include <linux/platform_device.h>
  30. #include <linux/slab.h>
  31. #include <linux/swab.h>
  32. #include <linux/types.h>
  33. #include "dma-iommu.h"
  34. #define DART_MAX_STREAMS 256
  35. #define DART_MAX_TTBR 4
  36. #define MAX_DARTS_PER_DEVICE 2
  37. #define DART_PARAMS1 0x00
  38. #define DART_PARAMS_PAGE_SHIFT GENMASK(27, 24)
  39. #define DART_PARAMS2 0x04
  40. #define DART_PARAMS_BYPASS_SUPPORT BIT(0)
  41. #define DART_STREAM_COMMAND 0x20
  42. #define DART_STREAM_COMMAND_BUSY BIT(2)
  43. #define DART_STREAM_COMMAND_INVALIDATE BIT(20)
  44. #define DART_STREAM_SELECT 0x34
  45. #define DART_ERROR 0x40
  46. #define DART_ERROR_STREAM GENMASK(27, 24)
  47. #define DART_ERROR_CODE GENMASK(11, 0)
  48. #define DART_ERROR_FLAG BIT(31)
  49. #define DART_ERROR_READ_FAULT BIT(4)
  50. #define DART_ERROR_WRITE_FAULT BIT(3)
  51. #define DART_ERROR_NO_PTE BIT(2)
  52. #define DART_ERROR_NO_PMD BIT(1)
  53. #define DART_ERROR_NO_TTBR BIT(0)
  54. #define DART_CONFIG 0x60
  55. #define DART_CONFIG_LOCK BIT(15)
  56. #define DART_STREAM_COMMAND_BUSY_TIMEOUT 100
  57. #define DART_ERROR_ADDR_HI 0x54
  58. #define DART_ERROR_ADDR_LO 0x50
  59. #define DART_STREAMS_ENABLE 0xfc
  60. #define DART_TCR(sid) (0x100 + 4 * (sid))
  61. #define DART_TCR_TRANSLATE_ENABLE BIT(7)
  62. #define DART_TCR_BYPASS0_ENABLE BIT(8)
  63. #define DART_TCR_BYPASS1_ENABLE BIT(12)
  64. #define DART_TTBR(sid, idx) (0x200 + 16 * (sid) + 4 * (idx))
  65. #define DART_TTBR_VALID BIT(31)
  66. #define DART_TTBR_SHIFT 12
/*
 * SoC-specific hardware description, obtained from the OF match data.
 *
 * @oas: output address size handed to io-pgtable when a domain is finalized
 * @fmt: io-pgtable format used to allocate the page table ops
 * @max_sid_count: number of stream ids; becomes apple_dart.num_streams
 */
struct apple_dart_hw {
	u32 oas;
	enum io_pgtable_fmt fmt;
	int max_sid_count;
};
/*
 * Private structure associated with each DART device.
 *
 * @dev: device struct
 * @hw: SoC-specific hardware data
 * @regs: mapped MMIO region
 * @irq: interrupt number, can be shared with other DARTs
 * @clks: clocks associated with this DART
 * @num_clks: number of @clks
 * @lock: lock for hardware operations involving this dart
 * @pgsize: pagesize supported by this DART
 * @num_streams: number of stream ids of this DART; copied from
 *               @hw->max_sid_count and rejected at probe time if it exceeds
 *               DART_MAX_STREAMS
 * @supports_bypass: indicates if this DART supports bypass mode
 * @force_bypass: force bypass mode due to pagesize mismatch?
 * @sid2group: maps stream ids to iommu_groups
 * @iommu: iommu core device
 * @save_tcr: per-stream TCR values. NOTE(review): not referenced in the part
 *            of the file reviewed here; presumably a register snapshot taken
 *            for suspend/resume - confirm
 * @save_ttbr: per-stream TTBR values; same caveat as @save_tcr
 */
struct apple_dart {
	struct device *dev;
	const struct apple_dart_hw *hw;
	void __iomem *regs;
	int irq;
	struct clk_bulk_data *clks;
	int num_clks;
	spinlock_t lock;
	u32 pgsize;
	u32 num_streams;
	u32 supports_bypass : 1;
	u32 force_bypass : 1;
	struct iommu_group *sid2group[DART_MAX_STREAMS];
	struct iommu_device iommu;
	u32 save_tcr[DART_MAX_STREAMS];
	u32 save_ttbr[DART_MAX_STREAMS][DART_MAX_TTBR];
};
/*
 * Convenience struct to identify streams.
 *
 * The normal variant is used inside apple_dart_master_cfg which isn't written
 * to concurrently.
 * The atomic variant is used inside apple_dart_domain where we have to guard
 * against races from potential parallel calls to attach/detach_device.
 * Note that even inside the atomic variant the apple_dart pointer is not
 * protected: This pointer is initialized once under the domain init mutex
 * and never changed again afterwards. Devices with different dart pointers
 * cannot be attached to the same domain.
 *
 * @dart: dart pointer
 * @sidmap: stream id bitmap with room for DART_MAX_STREAMS bits; bit N set
 *          means stream id N of @dart is part of this map
 */
struct apple_dart_stream_map {
	struct apple_dart *dart;
	DECLARE_BITMAP(sidmap, DART_MAX_STREAMS);
};
/* Same layout, but the bitmap words are updated with atomic_long_*(). */
struct apple_dart_atomic_stream_map {
	struct apple_dart *dart;
	atomic_long_t sidmap[BITS_TO_LONGS(DART_MAX_STREAMS)];
};
/*
 * This structure is attached to each iommu domain handled by a DART.
 *
 * @pgtbl_ops: pagetable ops allocated by io-pgtable; stays NULL for domains
 *             that are marked finalized at allocation time
 *             (IDENTITY/BLOCKED)
 * @finalized: true if the domain has been completely initialized
 * @init_lock: protects domain initialization
 * @stream_maps: streams attached to this domain (valid for DMA/UNMANAGED only)
 * @domain: core iommu domain pointer; to_dart_domain() maps it back to this
 *          structure
 */
struct apple_dart_domain {
	struct io_pgtable_ops *pgtbl_ops;
	bool finalized;
	struct mutex init_lock;
	struct apple_dart_atomic_stream_map stream_maps[MAX_DARTS_PER_DEVICE];
	struct iommu_domain domain;
};
/*
 * This structure is attached to devices with dev_iommu_priv_set() on of_xlate
 * and contains a list of streams bound to this device.
 * So far the worst case seen is a single device with two streams
 * from different darts, such that this simple static array is enough.
 *
 * @stream_maps: streams for this device, one entry per DART; entries are
 *               filled front to back and unused entries have a NULL dart
 */
struct apple_dart_master_cfg {
	struct apple_dart_stream_map stream_maps[MAX_DARTS_PER_DEVICE];
};
  155. /*
  156. * Helper macro to iterate over apple_dart_master_cfg.stream_maps and
  157. * apple_dart_domain.stream_maps
  158. *
  159. * @i int used as loop variable
  160. * @base pointer to base struct (apple_dart_master_cfg or apple_dart_domain)
  161. * @stream pointer to the apple_dart_streams struct for each loop iteration
  162. */
  163. #define for_each_stream_map(i, base, stream_map) \
  164. for (i = 0, stream_map = &(base)->stream_maps[0]; \
  165. i < MAX_DARTS_PER_DEVICE && stream_map->dart; \
  166. stream_map = &(base)->stream_maps[++i])
/*
 * Forward declarations. apple_dart_iommu_ops is defined further down in this
 * file. NOTE(review): the definition of apple_dart_driver is not part of the
 * section reviewed here - presumably it follows the probe/remove callbacks.
 */
static struct platform_driver apple_dart_driver;
static const struct iommu_ops apple_dart_iommu_ops;
  169. static struct apple_dart_domain *to_dart_domain(struct iommu_domain *dom)
  170. {
  171. return container_of(dom, struct apple_dart_domain, domain);
  172. }
  173. static void
  174. apple_dart_hw_enable_translation(struct apple_dart_stream_map *stream_map)
  175. {
  176. struct apple_dart *dart = stream_map->dart;
  177. int sid;
  178. for_each_set_bit(sid, stream_map->sidmap, dart->num_streams)
  179. writel(DART_TCR_TRANSLATE_ENABLE,
  180. dart->regs + DART_TCR(sid));
  181. }
  182. static void apple_dart_hw_disable_dma(struct apple_dart_stream_map *stream_map)
  183. {
  184. struct apple_dart *dart = stream_map->dart;
  185. int sid;
  186. for_each_set_bit(sid, stream_map->sidmap, dart->num_streams)
  187. writel(0, dart->regs + DART_TCR(sid));
  188. }
  189. static void
  190. apple_dart_hw_enable_bypass(struct apple_dart_stream_map *stream_map)
  191. {
  192. struct apple_dart *dart = stream_map->dart;
  193. int sid;
  194. WARN_ON(!stream_map->dart->supports_bypass);
  195. for_each_set_bit(sid, stream_map->sidmap, dart->num_streams)
  196. writel(DART_TCR_BYPASS0_ENABLE | DART_TCR_BYPASS1_ENABLE,
  197. dart->regs + DART_TCR(sid));
  198. }
  199. static void apple_dart_hw_set_ttbr(struct apple_dart_stream_map *stream_map,
  200. u8 idx, phys_addr_t paddr)
  201. {
  202. struct apple_dart *dart = stream_map->dart;
  203. int sid;
  204. WARN_ON(paddr & ((1 << DART_TTBR_SHIFT) - 1));
  205. for_each_set_bit(sid, stream_map->sidmap, dart->num_streams)
  206. writel(DART_TTBR_VALID | (paddr >> DART_TTBR_SHIFT),
  207. dart->regs + DART_TTBR(sid, idx));
  208. }
  209. static void apple_dart_hw_clear_ttbr(struct apple_dart_stream_map *stream_map,
  210. u8 idx)
  211. {
  212. struct apple_dart *dart = stream_map->dart;
  213. int sid;
  214. for_each_set_bit(sid, stream_map->sidmap, dart->num_streams)
  215. writel(0, dart->regs + DART_TTBR(sid, idx));
  216. }
  217. static void
  218. apple_dart_hw_clear_all_ttbrs(struct apple_dart_stream_map *stream_map)
  219. {
  220. int i;
  221. for (i = 0; i < DART_MAX_TTBR; ++i)
  222. apple_dart_hw_clear_ttbr(stream_map, i);
  223. }
  224. static int
  225. apple_dart_hw_stream_command(struct apple_dart_stream_map *stream_map,
  226. u32 command)
  227. {
  228. unsigned long flags;
  229. int ret;
  230. u32 command_reg;
  231. spin_lock_irqsave(&stream_map->dart->lock, flags);
  232. writel(stream_map->sidmap[0], stream_map->dart->regs + DART_STREAM_SELECT);
  233. writel(command, stream_map->dart->regs + DART_STREAM_COMMAND);
  234. ret = readl_poll_timeout_atomic(
  235. stream_map->dart->regs + DART_STREAM_COMMAND, command_reg,
  236. !(command_reg & DART_STREAM_COMMAND_BUSY), 1,
  237. DART_STREAM_COMMAND_BUSY_TIMEOUT);
  238. spin_unlock_irqrestore(&stream_map->dart->lock, flags);
  239. if (ret) {
  240. dev_err(stream_map->dart->dev,
  241. "busy bit did not clear after command %x for streams %lx\n",
  242. command, stream_map->sidmap[0]);
  243. return ret;
  244. }
  245. return 0;
  246. }
  247. static int
  248. apple_dart_hw_invalidate_tlb(struct apple_dart_stream_map *stream_map)
  249. {
  250. return apple_dart_hw_stream_command(stream_map,
  251. DART_STREAM_COMMAND_INVALIDATE);
  252. }
  253. static int apple_dart_hw_reset(struct apple_dart *dart)
  254. {
  255. u32 config;
  256. struct apple_dart_stream_map stream_map;
  257. int i;
  258. config = readl(dart->regs + DART_CONFIG);
  259. if (config & DART_CONFIG_LOCK) {
  260. dev_err(dart->dev, "DART is locked down until reboot: %08x\n",
  261. config);
  262. return -EINVAL;
  263. }
  264. stream_map.dart = dart;
  265. bitmap_zero(stream_map.sidmap, DART_MAX_STREAMS);
  266. bitmap_set(stream_map.sidmap, 0, dart->num_streams);
  267. apple_dart_hw_disable_dma(&stream_map);
  268. apple_dart_hw_clear_all_ttbrs(&stream_map);
  269. /* enable all streams globally since TCR is used to control isolation */
  270. for (i = 0; i < BITS_TO_U32(dart->num_streams); i++)
  271. writel(U32_MAX, dart->regs + DART_STREAMS_ENABLE + 4 * i);
  272. /* clear any pending errors before the interrupt is unmasked */
  273. writel(readl(dart->regs + DART_ERROR), dart->regs + DART_ERROR);
  274. return apple_dart_hw_invalidate_tlb(&stream_map);
  275. }
  276. static void apple_dart_domain_flush_tlb(struct apple_dart_domain *domain)
  277. {
  278. int i, j;
  279. struct apple_dart_atomic_stream_map *domain_stream_map;
  280. struct apple_dart_stream_map stream_map;
  281. for_each_stream_map(i, domain, domain_stream_map) {
  282. stream_map.dart = domain_stream_map->dart;
  283. for (j = 0; j < BITS_TO_LONGS(stream_map.dart->num_streams); j++)
  284. stream_map.sidmap[j] = atomic_long_read(&domain_stream_map->sidmap[j]);
  285. apple_dart_hw_invalidate_tlb(&stream_map);
  286. }
  287. }
  288. static void apple_dart_flush_iotlb_all(struct iommu_domain *domain)
  289. {
  290. apple_dart_domain_flush_tlb(to_dart_domain(domain));
  291. }
  292. static void apple_dart_iotlb_sync(struct iommu_domain *domain,
  293. struct iommu_iotlb_gather *gather)
  294. {
  295. apple_dart_domain_flush_tlb(to_dart_domain(domain));
  296. }
  297. static void apple_dart_iotlb_sync_map(struct iommu_domain *domain,
  298. unsigned long iova, size_t size)
  299. {
  300. apple_dart_domain_flush_tlb(to_dart_domain(domain));
  301. }
  302. static phys_addr_t apple_dart_iova_to_phys(struct iommu_domain *domain,
  303. dma_addr_t iova)
  304. {
  305. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  306. struct io_pgtable_ops *ops = dart_domain->pgtbl_ops;
  307. if (!ops)
  308. return 0;
  309. return ops->iova_to_phys(ops, iova);
  310. }
  311. static int apple_dart_map_pages(struct iommu_domain *domain, unsigned long iova,
  312. phys_addr_t paddr, size_t pgsize,
  313. size_t pgcount, int prot, gfp_t gfp,
  314. size_t *mapped)
  315. {
  316. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  317. struct io_pgtable_ops *ops = dart_domain->pgtbl_ops;
  318. if (!ops)
  319. return -ENODEV;
  320. return ops->map_pages(ops, iova, paddr, pgsize, pgcount, prot, gfp,
  321. mapped);
  322. }
  323. static size_t apple_dart_unmap_pages(struct iommu_domain *domain,
  324. unsigned long iova, size_t pgsize,
  325. size_t pgcount,
  326. struct iommu_iotlb_gather *gather)
  327. {
  328. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  329. struct io_pgtable_ops *ops = dart_domain->pgtbl_ops;
  330. return ops->unmap_pages(ops, iova, pgsize, pgcount, gather);
  331. }
  332. static void
  333. apple_dart_setup_translation(struct apple_dart_domain *domain,
  334. struct apple_dart_stream_map *stream_map)
  335. {
  336. int i;
  337. struct io_pgtable_cfg *pgtbl_cfg =
  338. &io_pgtable_ops_to_pgtable(domain->pgtbl_ops)->cfg;
  339. for (i = 0; i < pgtbl_cfg->apple_dart_cfg.n_ttbrs; ++i)
  340. apple_dart_hw_set_ttbr(stream_map, i,
  341. pgtbl_cfg->apple_dart_cfg.ttbr[i]);
  342. for (; i < DART_MAX_TTBR; ++i)
  343. apple_dart_hw_clear_ttbr(stream_map, i);
  344. apple_dart_hw_enable_translation(stream_map);
  345. apple_dart_hw_invalidate_tlb(stream_map);
  346. }
  347. static int apple_dart_finalize_domain(struct iommu_domain *domain,
  348. struct apple_dart_master_cfg *cfg)
  349. {
  350. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  351. struct apple_dart *dart = cfg->stream_maps[0].dart;
  352. struct io_pgtable_cfg pgtbl_cfg;
  353. int ret = 0;
  354. int i, j;
  355. mutex_lock(&dart_domain->init_lock);
  356. if (dart_domain->finalized)
  357. goto done;
  358. for (i = 0; i < MAX_DARTS_PER_DEVICE; ++i) {
  359. dart_domain->stream_maps[i].dart = cfg->stream_maps[i].dart;
  360. for (j = 0; j < BITS_TO_LONGS(dart->num_streams); j++)
  361. atomic_long_set(&dart_domain->stream_maps[i].sidmap[j],
  362. cfg->stream_maps[i].sidmap[j]);
  363. }
  364. pgtbl_cfg = (struct io_pgtable_cfg){
  365. .pgsize_bitmap = dart->pgsize,
  366. .ias = 32,
  367. .oas = dart->hw->oas,
  368. .coherent_walk = 1,
  369. .iommu_dev = dart->dev,
  370. };
  371. dart_domain->pgtbl_ops =
  372. alloc_io_pgtable_ops(dart->hw->fmt, &pgtbl_cfg, domain);
  373. if (!dart_domain->pgtbl_ops) {
  374. ret = -ENOMEM;
  375. goto done;
  376. }
  377. domain->pgsize_bitmap = pgtbl_cfg.pgsize_bitmap;
  378. domain->geometry.aperture_start = 0;
  379. domain->geometry.aperture_end = DMA_BIT_MASK(32);
  380. domain->geometry.force_aperture = true;
  381. dart_domain->finalized = true;
  382. done:
  383. mutex_unlock(&dart_domain->init_lock);
  384. return ret;
  385. }
  386. static int
  387. apple_dart_mod_streams(struct apple_dart_atomic_stream_map *domain_maps,
  388. struct apple_dart_stream_map *master_maps,
  389. bool add_streams)
  390. {
  391. int i, j;
  392. for (i = 0; i < MAX_DARTS_PER_DEVICE; ++i) {
  393. if (domain_maps[i].dart != master_maps[i].dart)
  394. return -EINVAL;
  395. }
  396. for (i = 0; i < MAX_DARTS_PER_DEVICE; ++i) {
  397. if (!domain_maps[i].dart)
  398. break;
  399. for (j = 0; j < BITS_TO_LONGS(domain_maps[i].dart->num_streams); j++) {
  400. if (add_streams)
  401. atomic_long_or(master_maps[i].sidmap[j],
  402. &domain_maps[i].sidmap[j]);
  403. else
  404. atomic_long_and(~master_maps[i].sidmap[j],
  405. &domain_maps[i].sidmap[j]);
  406. }
  407. }
  408. return 0;
  409. }
  410. static int apple_dart_domain_add_streams(struct apple_dart_domain *domain,
  411. struct apple_dart_master_cfg *cfg)
  412. {
  413. return apple_dart_mod_streams(domain->stream_maps, cfg->stream_maps,
  414. true);
  415. }
  416. static int apple_dart_domain_remove_streams(struct apple_dart_domain *domain,
  417. struct apple_dart_master_cfg *cfg)
  418. {
  419. return apple_dart_mod_streams(domain->stream_maps, cfg->stream_maps,
  420. false);
  421. }
  422. static int apple_dart_attach_dev(struct iommu_domain *domain,
  423. struct device *dev)
  424. {
  425. int ret, i;
  426. struct apple_dart_stream_map *stream_map;
  427. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  428. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  429. if (cfg->stream_maps[0].dart->force_bypass &&
  430. domain->type != IOMMU_DOMAIN_IDENTITY)
  431. return -EINVAL;
  432. if (!cfg->stream_maps[0].dart->supports_bypass &&
  433. domain->type == IOMMU_DOMAIN_IDENTITY)
  434. return -EINVAL;
  435. ret = apple_dart_finalize_domain(domain, cfg);
  436. if (ret)
  437. return ret;
  438. switch (domain->type) {
  439. case IOMMU_DOMAIN_DMA:
  440. case IOMMU_DOMAIN_UNMANAGED:
  441. ret = apple_dart_domain_add_streams(dart_domain, cfg);
  442. if (ret)
  443. return ret;
  444. for_each_stream_map(i, cfg, stream_map)
  445. apple_dart_setup_translation(dart_domain, stream_map);
  446. break;
  447. case IOMMU_DOMAIN_BLOCKED:
  448. for_each_stream_map(i, cfg, stream_map)
  449. apple_dart_hw_disable_dma(stream_map);
  450. break;
  451. case IOMMU_DOMAIN_IDENTITY:
  452. for_each_stream_map(i, cfg, stream_map)
  453. apple_dart_hw_enable_bypass(stream_map);
  454. break;
  455. }
  456. return ret;
  457. }
  458. static void apple_dart_detach_dev(struct iommu_domain *domain,
  459. struct device *dev)
  460. {
  461. int i;
  462. struct apple_dart_stream_map *stream_map;
  463. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  464. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  465. for_each_stream_map(i, cfg, stream_map)
  466. apple_dart_hw_disable_dma(stream_map);
  467. if (domain->type == IOMMU_DOMAIN_DMA ||
  468. domain->type == IOMMU_DOMAIN_UNMANAGED)
  469. apple_dart_domain_remove_streams(dart_domain, cfg);
  470. }
  471. static struct iommu_device *apple_dart_probe_device(struct device *dev)
  472. {
  473. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  474. struct apple_dart_stream_map *stream_map;
  475. int i;
  476. if (!cfg)
  477. return ERR_PTR(-ENODEV);
  478. for_each_stream_map(i, cfg, stream_map)
  479. device_link_add(
  480. dev, stream_map->dart->dev,
  481. DL_FLAG_PM_RUNTIME | DL_FLAG_AUTOREMOVE_SUPPLIER);
  482. return &cfg->stream_maps[0].dart->iommu;
  483. }
  484. static void apple_dart_release_device(struct device *dev)
  485. {
  486. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  487. dev_iommu_priv_set(dev, NULL);
  488. kfree(cfg);
  489. }
  490. static struct iommu_domain *apple_dart_domain_alloc(unsigned int type)
  491. {
  492. struct apple_dart_domain *dart_domain;
  493. if (type != IOMMU_DOMAIN_DMA && type != IOMMU_DOMAIN_UNMANAGED &&
  494. type != IOMMU_DOMAIN_IDENTITY && type != IOMMU_DOMAIN_BLOCKED)
  495. return NULL;
  496. dart_domain = kzalloc(sizeof(*dart_domain), GFP_KERNEL);
  497. if (!dart_domain)
  498. return NULL;
  499. mutex_init(&dart_domain->init_lock);
  500. /* no need to allocate pgtbl_ops or do any other finalization steps */
  501. if (type == IOMMU_DOMAIN_IDENTITY || type == IOMMU_DOMAIN_BLOCKED)
  502. dart_domain->finalized = true;
  503. return &dart_domain->domain;
  504. }
  505. static void apple_dart_domain_free(struct iommu_domain *domain)
  506. {
  507. struct apple_dart_domain *dart_domain = to_dart_domain(domain);
  508. if (dart_domain->pgtbl_ops)
  509. free_io_pgtable_ops(dart_domain->pgtbl_ops);
  510. kfree(dart_domain);
  511. }
  512. static int apple_dart_of_xlate(struct device *dev, struct of_phandle_args *args)
  513. {
  514. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  515. struct platform_device *iommu_pdev = of_find_device_by_node(args->np);
  516. struct apple_dart *dart = platform_get_drvdata(iommu_pdev);
  517. struct apple_dart *cfg_dart;
  518. int i, sid;
  519. if (args->args_count != 1)
  520. return -EINVAL;
  521. sid = args->args[0];
  522. if (!cfg)
  523. cfg = kzalloc(sizeof(*cfg), GFP_KERNEL);
  524. if (!cfg)
  525. return -ENOMEM;
  526. dev_iommu_priv_set(dev, cfg);
  527. cfg_dart = cfg->stream_maps[0].dart;
  528. if (cfg_dart) {
  529. if (cfg_dart->supports_bypass != dart->supports_bypass)
  530. return -EINVAL;
  531. if (cfg_dart->force_bypass != dart->force_bypass)
  532. return -EINVAL;
  533. if (cfg_dart->pgsize != dart->pgsize)
  534. return -EINVAL;
  535. }
  536. for (i = 0; i < MAX_DARTS_PER_DEVICE; ++i) {
  537. if (cfg->stream_maps[i].dart == dart) {
  538. set_bit(sid, cfg->stream_maps[i].sidmap);
  539. return 0;
  540. }
  541. }
  542. for (i = 0; i < MAX_DARTS_PER_DEVICE; ++i) {
  543. if (!cfg->stream_maps[i].dart) {
  544. cfg->stream_maps[i].dart = dart;
  545. set_bit(sid, cfg->stream_maps[i].sidmap);
  546. return 0;
  547. }
  548. }
  549. return -EINVAL;
  550. }
  551. static DEFINE_MUTEX(apple_dart_groups_lock);
  552. static void apple_dart_release_group(void *iommu_data)
  553. {
  554. int i, sid;
  555. struct apple_dart_stream_map *stream_map;
  556. struct apple_dart_master_cfg *group_master_cfg = iommu_data;
  557. mutex_lock(&apple_dart_groups_lock);
  558. for_each_stream_map(i, group_master_cfg, stream_map)
  559. for_each_set_bit(sid, stream_map->sidmap, stream_map->dart->num_streams)
  560. stream_map->dart->sid2group[sid] = NULL;
  561. kfree(iommu_data);
  562. mutex_unlock(&apple_dart_groups_lock);
  563. }
  564. static int apple_dart_merge_master_cfg(struct apple_dart_master_cfg *dst,
  565. struct apple_dart_master_cfg *src)
  566. {
  567. /*
  568. * We know that this function is only called for groups returned from
  569. * pci_device_group and that all Apple Silicon platforms never spread
  570. * PCIe devices from the same bus across multiple DARTs such that we can
  571. * just assume that both src and dst only have the same single DART.
  572. */
  573. if (src->stream_maps[1].dart)
  574. return -EINVAL;
  575. if (dst->stream_maps[1].dart)
  576. return -EINVAL;
  577. if (src->stream_maps[0].dart != dst->stream_maps[0].dart)
  578. return -EINVAL;
  579. bitmap_or(dst->stream_maps[0].sidmap,
  580. dst->stream_maps[0].sidmap,
  581. src->stream_maps[0].sidmap,
  582. dst->stream_maps[0].dart->num_streams);
  583. return 0;
  584. }
  585. static struct iommu_group *apple_dart_device_group(struct device *dev)
  586. {
  587. int i, sid;
  588. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  589. struct apple_dart_stream_map *stream_map;
  590. struct apple_dart_master_cfg *group_master_cfg;
  591. struct iommu_group *group = NULL;
  592. struct iommu_group *res = ERR_PTR(-EINVAL);
  593. mutex_lock(&apple_dart_groups_lock);
  594. for_each_stream_map(i, cfg, stream_map) {
  595. for_each_set_bit(sid, stream_map->sidmap, stream_map->dart->num_streams) {
  596. struct iommu_group *stream_group =
  597. stream_map->dart->sid2group[sid];
  598. if (group && group != stream_group) {
  599. res = ERR_PTR(-EINVAL);
  600. goto out;
  601. }
  602. group = stream_group;
  603. }
  604. }
  605. if (group) {
  606. res = iommu_group_ref_get(group);
  607. goto out;
  608. }
  609. #ifdef CONFIG_PCI
  610. if (dev_is_pci(dev))
  611. group = pci_device_group(dev);
  612. else
  613. #endif
  614. group = generic_device_group(dev);
  615. res = ERR_PTR(-ENOMEM);
  616. if (!group)
  617. goto out;
  618. group_master_cfg = iommu_group_get_iommudata(group);
  619. if (group_master_cfg) {
  620. int ret;
  621. ret = apple_dart_merge_master_cfg(group_master_cfg, cfg);
  622. if (ret) {
  623. dev_err(dev, "Failed to merge DART IOMMU grups.\n");
  624. iommu_group_put(group);
  625. res = ERR_PTR(ret);
  626. goto out;
  627. }
  628. } else {
  629. group_master_cfg = kmemdup(cfg, sizeof(*group_master_cfg),
  630. GFP_KERNEL);
  631. if (!group_master_cfg) {
  632. iommu_group_put(group);
  633. goto out;
  634. }
  635. iommu_group_set_iommudata(group, group_master_cfg,
  636. apple_dart_release_group);
  637. }
  638. for_each_stream_map(i, cfg, stream_map)
  639. for_each_set_bit(sid, stream_map->sidmap, stream_map->dart->num_streams)
  640. stream_map->dart->sid2group[sid] = group;
  641. res = group;
  642. out:
  643. mutex_unlock(&apple_dart_groups_lock);
  644. return res;
  645. }
  646. static int apple_dart_def_domain_type(struct device *dev)
  647. {
  648. struct apple_dart_master_cfg *cfg = dev_iommu_priv_get(dev);
  649. if (cfg->stream_maps[0].dart->force_bypass)
  650. return IOMMU_DOMAIN_IDENTITY;
  651. if (!cfg->stream_maps[0].dart->supports_bypass)
  652. return IOMMU_DOMAIN_DMA;
  653. return 0;
  654. }
  655. #ifndef CONFIG_PCIE_APPLE_MSI_DOORBELL_ADDR
  656. /* Keep things compiling when CONFIG_PCI_APPLE isn't selected */
  657. #define CONFIG_PCIE_APPLE_MSI_DOORBELL_ADDR 0
  658. #endif
  659. #define DOORBELL_ADDR (CONFIG_PCIE_APPLE_MSI_DOORBELL_ADDR & PAGE_MASK)
  660. static void apple_dart_get_resv_regions(struct device *dev,
  661. struct list_head *head)
  662. {
  663. if (IS_ENABLED(CONFIG_PCIE_APPLE) && dev_is_pci(dev)) {
  664. struct iommu_resv_region *region;
  665. int prot = IOMMU_WRITE | IOMMU_NOEXEC | IOMMU_MMIO;
  666. region = iommu_alloc_resv_region(DOORBELL_ADDR,
  667. PAGE_SIZE, prot,
  668. IOMMU_RESV_MSI, GFP_KERNEL);
  669. if (!region)
  670. return;
  671. list_add_tail(&region->list, head);
  672. }
  673. iommu_dma_get_resv_regions(dev, head);
  674. }
  675. static const struct iommu_ops apple_dart_iommu_ops = {
  676. .domain_alloc = apple_dart_domain_alloc,
  677. .probe_device = apple_dart_probe_device,
  678. .release_device = apple_dart_release_device,
  679. .device_group = apple_dart_device_group,
  680. .of_xlate = apple_dart_of_xlate,
  681. .def_domain_type = apple_dart_def_domain_type,
  682. .get_resv_regions = apple_dart_get_resv_regions,
  683. .pgsize_bitmap = -1UL, /* Restricted during dart probe */
  684. .owner = THIS_MODULE,
  685. .default_domain_ops = &(const struct iommu_domain_ops) {
  686. .attach_dev = apple_dart_attach_dev,
  687. .detach_dev = apple_dart_detach_dev,
  688. .map_pages = apple_dart_map_pages,
  689. .unmap_pages = apple_dart_unmap_pages,
  690. .flush_iotlb_all = apple_dart_flush_iotlb_all,
  691. .iotlb_sync = apple_dart_iotlb_sync,
  692. .iotlb_sync_map = apple_dart_iotlb_sync_map,
  693. .iova_to_phys = apple_dart_iova_to_phys,
  694. .free = apple_dart_domain_free,
  695. }
  696. };
  697. static irqreturn_t apple_dart_irq(int irq, void *dev)
  698. {
  699. struct apple_dart *dart = dev;
  700. const char *fault_name = NULL;
  701. u32 error = readl(dart->regs + DART_ERROR);
  702. u32 error_code = FIELD_GET(DART_ERROR_CODE, error);
  703. u32 addr_lo = readl(dart->regs + DART_ERROR_ADDR_LO);
  704. u32 addr_hi = readl(dart->regs + DART_ERROR_ADDR_HI);
  705. u64 addr = addr_lo | (((u64)addr_hi) << 32);
  706. u8 stream_idx = FIELD_GET(DART_ERROR_STREAM, error);
  707. if (!(error & DART_ERROR_FLAG))
  708. return IRQ_NONE;
  709. /* there should only be a single bit set but let's use == to be sure */
  710. if (error_code == DART_ERROR_READ_FAULT)
  711. fault_name = "READ FAULT";
  712. else if (error_code == DART_ERROR_WRITE_FAULT)
  713. fault_name = "WRITE FAULT";
  714. else if (error_code == DART_ERROR_NO_PTE)
  715. fault_name = "NO PTE FOR IOVA";
  716. else if (error_code == DART_ERROR_NO_PMD)
  717. fault_name = "NO PMD FOR IOVA";
  718. else if (error_code == DART_ERROR_NO_TTBR)
  719. fault_name = "NO TTBR FOR IOVA";
  720. else
  721. fault_name = "unknown";
  722. dev_err_ratelimited(
  723. dart->dev,
  724. "translation fault: status:0x%x stream:%d code:0x%x (%s) at 0x%llx",
  725. error, stream_idx, error_code, fault_name, addr);
  726. writel(error, dart->regs + DART_ERROR);
  727. return IRQ_HANDLED;
  728. }
  729. static int apple_dart_probe(struct platform_device *pdev)
  730. {
  731. int ret;
  732. u32 dart_params[2];
  733. struct resource *res;
  734. struct apple_dart *dart;
  735. struct device *dev = &pdev->dev;
  736. dart = devm_kzalloc(dev, sizeof(*dart), GFP_KERNEL);
  737. if (!dart)
  738. return -ENOMEM;
  739. dart->dev = dev;
  740. dart->hw = of_device_get_match_data(dev);
  741. spin_lock_init(&dart->lock);
  742. dart->regs = devm_platform_get_and_ioremap_resource(pdev, 0, &res);
  743. if (IS_ERR(dart->regs))
  744. return PTR_ERR(dart->regs);
  745. if (resource_size(res) < 0x4000) {
  746. dev_err(dev, "MMIO region too small (%pr)\n", res);
  747. return -EINVAL;
  748. }
  749. dart->irq = platform_get_irq(pdev, 0);
  750. if (dart->irq < 0)
  751. return -ENODEV;
  752. ret = devm_clk_bulk_get_all(dev, &dart->clks);
  753. if (ret < 0)
  754. return ret;
  755. dart->num_clks = ret;
  756. ret = clk_bulk_prepare_enable(dart->num_clks, dart->clks);
  757. if (ret)
  758. return ret;
  759. dart_params[0] = readl(dart->regs + DART_PARAMS1);
  760. dart_params[1] = readl(dart->regs + DART_PARAMS2);
  761. dart->pgsize = 1 << FIELD_GET(DART_PARAMS_PAGE_SHIFT, dart_params[0]);
  762. dart->supports_bypass = dart_params[1] & DART_PARAMS_BYPASS_SUPPORT;
  763. dart->num_streams = dart->hw->max_sid_count;
  764. if (dart->num_streams > DART_MAX_STREAMS) {
  765. dev_err(&pdev->dev, "Too many streams (%d > %d)\n",
  766. dart->num_streams, DART_MAX_STREAMS);
  767. ret = -EINVAL;
  768. goto err_clk_disable;
  769. }
  770. dart->force_bypass = dart->pgsize > PAGE_SIZE;
  771. ret = apple_dart_hw_reset(dart);
  772. if (ret)
  773. goto err_clk_disable;
  774. ret = request_irq(dart->irq, apple_dart_irq, IRQF_SHARED,
  775. "apple-dart fault handler", dart);
  776. if (ret)
  777. goto err_clk_disable;
  778. platform_set_drvdata(pdev, dart);
  779. ret = iommu_device_sysfs_add(&dart->iommu, dev, NULL, "apple-dart.%s",
  780. dev_name(&pdev->dev));
  781. if (ret)
  782. goto err_free_irq;
  783. ret = iommu_device_register(&dart->iommu, &apple_dart_iommu_ops, dev);
  784. if (ret)
  785. goto err_sysfs_remove;
  786. dev_info(
  787. &pdev->dev,
  788. "DART [pagesize %x, %d streams, bypass support: %d, bypass forced: %d] initialized\n",
  789. dart->pgsize, dart->num_streams, dart->supports_bypass, dart->force_bypass);
  790. return 0;
  791. err_sysfs_remove:
  792. iommu_device_sysfs_remove(&dart->iommu);
  793. err_free_irq:
  794. free_irq(dart->irq, dart);
  795. err_clk_disable:
  796. clk_bulk_disable_unprepare(dart->num_clks, dart->clks);
  797. return ret;
  798. }
  799. static int apple_dart_remove(struct platform_device *pdev)
  800. {
  801. struct apple_dart *dart = platform_get_drvdata(pdev);
  802. apple_dart_hw_reset(dart);
  803. free_irq(dart->irq, dart);
  804. iommu_device_unregister(&dart->iommu);
  805. iommu_device_sysfs_remove(&dart->iommu);
  806. clk_bulk_disable_unprepare(dart->num_clks, dart->clks);
  807. return 0;
  808. }
  809. static const struct apple_dart_hw apple_dart_hw_t8103 = {
  810. .oas = 36,
  811. .fmt = APPLE_DART,
  812. .max_sid_count = 16,
  813. };
  814. static const struct apple_dart_hw apple_dart_hw_t6000 = {
  815. .oas = 42,
  816. .fmt = APPLE_DART2,
  817. .max_sid_count = 16,
  818. };
  819. static __maybe_unused int apple_dart_suspend(struct device *dev)
  820. {
  821. struct apple_dart *dart = dev_get_drvdata(dev);
  822. unsigned int sid, idx;
  823. for (sid = 0; sid < dart->num_streams; sid++) {
  824. dart->save_tcr[sid] = readl_relaxed(dart->regs + DART_TCR(sid));
  825. for (idx = 0; idx < DART_MAX_TTBR; idx++)
  826. dart->save_ttbr[sid][idx] =
  827. readl(dart->regs + DART_TTBR(sid, idx));
  828. }
  829. return 0;
  830. }
  831. static __maybe_unused int apple_dart_resume(struct device *dev)
  832. {
  833. struct apple_dart *dart = dev_get_drvdata(dev);
  834. unsigned int sid, idx;
  835. int ret;
  836. ret = apple_dart_hw_reset(dart);
  837. if (ret) {
  838. dev_err(dev, "Failed to reset DART on resume\n");
  839. return ret;
  840. }
  841. for (sid = 0; sid < dart->num_streams; sid++) {
  842. for (idx = 0; idx < DART_MAX_TTBR; idx++)
  843. writel(dart->save_ttbr[sid][idx],
  844. dart->regs + DART_TTBR(sid, idx));
  845. writel(dart->save_tcr[sid], dart->regs + DART_TCR(sid));
  846. }
  847. return 0;
  848. }
  849. DEFINE_SIMPLE_DEV_PM_OPS(apple_dart_pm_ops, apple_dart_suspend, apple_dart_resume);
  850. static const struct of_device_id apple_dart_of_match[] = {
  851. { .compatible = "apple,t8103-dart", .data = &apple_dart_hw_t8103 },
  852. { .compatible = "apple,t6000-dart", .data = &apple_dart_hw_t6000 },
  853. {},
  854. };
  855. MODULE_DEVICE_TABLE(of, apple_dart_of_match);
  856. static struct platform_driver apple_dart_driver = {
  857. .driver = {
  858. .name = "apple-dart",
  859. .of_match_table = apple_dart_of_match,
  860. .suppress_bind_attrs = true,
  861. .pm = pm_sleep_ptr(&apple_dart_pm_ops),
  862. },
  863. .probe = apple_dart_probe,
  864. .remove = apple_dart_remove,
  865. };
  866. module_platform_driver(apple_dart_driver);
  867. MODULE_DESCRIPTION("IOMMU API for Apple's DART");
  868. MODULE_AUTHOR("Sven Peter <sven@svenpeter.dev>");
  869. MODULE_LICENSE("GPL v2");