adreno_a6xx_hwsched.c 36 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (c) 2020-2021, The Linux Foundation. All rights reserved.
  4. * Copyright (c) 2022-2024, Qualcomm Innovation Center, Inc. All rights reserved.
  5. */
  6. #include <linux/clk.h>
  7. #include <linux/component.h>
  8. #include <linux/interconnect.h>
  9. #include "adreno.h"
  10. #include "adreno_a6xx.h"
  11. #include "adreno_a6xx_hwsched.h"
  12. #include "adreno_hfi.h"
  13. #include "adreno_snapshot.h"
  14. #include "kgsl_bus.h"
  15. #include "kgsl_device.h"
  16. #include "kgsl_trace.h"
  17. static size_t adreno_hwsched_snapshot_rb(struct kgsl_device *device, u8 *buf,
  18. size_t remain, void *priv)
  19. {
  20. struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
  21. u32 *data = (u32 *)(buf + sizeof(*header));
  22. struct kgsl_memdesc *rb = (struct kgsl_memdesc *)priv;
  23. if (remain < rb->size + sizeof(*header)) {
  24. SNAPSHOT_ERR_NOMEM(device, "RB");
  25. return 0;
  26. }
  27. header->start = 0;
  28. header->end = rb->size >> 2;
  29. header->rptr = 0;
  30. header->rbsize = rb->size >> 2;
  31. header->count = rb->size >> 2;
  32. header->timestamp_queued = 0;
  33. header->timestamp_retired = 0;
  34. header->gpuaddr = rb->gpuaddr;
  35. header->id = 0;
  36. memcpy(data, rb->hostptr, rb->size);
  37. return rb->size + sizeof(*header);
  38. }
  39. static void a6xx_hwsched_snapshot_preemption_record(struct kgsl_device *device,
  40. struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md, u64 offset)
  41. {
  42. struct kgsl_snapshot_section_header *section_header =
  43. (struct kgsl_snapshot_section_header *)snapshot->ptr;
  44. u8 *dest = snapshot->ptr + sizeof(*section_header);
  45. struct kgsl_snapshot_gpu_object_v2 *header =
  46. (struct kgsl_snapshot_gpu_object_v2 *)dest;
  47. const struct adreno_a6xx_core *a6xx_core = to_a6xx_core(ADRENO_DEVICE(device));
  48. u64 ctxt_record_size = A6XX_CP_CTXRECORD_SIZE_IN_BYTES;
  49. size_t section_size;
  50. if (a6xx_core->ctxt_record_size)
  51. ctxt_record_size = a6xx_core->ctxt_record_size;
  52. ctxt_record_size = min_t(u64, ctxt_record_size, device->snapshot_ctxt_record_size);
  53. section_size = sizeof(*section_header) + sizeof(*header) + ctxt_record_size;
  54. if (snapshot->remain < section_size) {
  55. SNAPSHOT_ERR_NOMEM(device, "PREEMPTION RECORD");
  56. return;
  57. }
  58. section_header->magic = SNAPSHOT_SECTION_MAGIC;
  59. section_header->id = KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2;
  60. section_header->size = section_size;
  61. header->size = ctxt_record_size >> 2;
  62. header->gpuaddr = md->gpuaddr + offset;
  63. header->ptbase =
  64. kgsl_mmu_pagetable_get_ttbr0(device->mmu.defaultpagetable);
  65. header->type = SNAPSHOT_GPU_OBJECT_GLOBAL;
  66. dest += sizeof(*header);
  67. memcpy(dest, md->hostptr + offset, ctxt_record_size);
  68. snapshot->ptr += section_header->size;
  69. snapshot->remain -= section_header->size;
  70. snapshot->size += section_header->size;
  71. }
  72. static void snapshot_preemption_records(struct kgsl_device *device,
  73. struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md)
  74. {
  75. const struct adreno_a6xx_core *a6xx_core =
  76. to_a6xx_core(ADRENO_DEVICE(device));
  77. u64 ctxt_record_size = A6XX_CP_CTXRECORD_SIZE_IN_BYTES;
  78. u64 offset;
  79. if (a6xx_core->ctxt_record_size)
  80. ctxt_record_size = a6xx_core->ctxt_record_size;
  81. /* All preemption records exist as a single mem alloc entry */
  82. for (offset = 0; offset < md->size; offset += ctxt_record_size)
  83. a6xx_hwsched_snapshot_preemption_record(device, snapshot, md,
  84. offset);
  85. }
  86. static void *get_rb_hostptr(struct adreno_device *adreno_dev,
  87. u64 gpuaddr, u32 size)
  88. {
  89. struct a6xx_hwsched_hfi *hw_hfi = to_a6xx_hwsched_hfi(adreno_dev);
  90. u64 offset;
  91. u32 i;
  92. for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
  93. struct kgsl_memdesc *md = hw_hfi->mem_alloc_table[i].md;
  94. if (md && (gpuaddr >= md->gpuaddr) &&
  95. ((gpuaddr + size) <= (md->gpuaddr + md->size))) {
  96. offset = gpuaddr - md->gpuaddr;
  97. return md->hostptr + offset;
  98. }
  99. }
  100. return NULL;
  101. }
  102. static u32 a6xx_copy_gpu_global(void *out, void *in, u32 size)
  103. {
  104. if (out && in) {
  105. memcpy(out, in, size);
  106. return size;
  107. }
  108. return 0;
  109. }
  110. static void adreno_hwsched_snapshot_rb_payload(struct adreno_device *adreno_dev,
  111. struct kgsl_snapshot *snapshot, struct payload_section *payload)
  112. {
  113. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  114. struct kgsl_snapshot_section_header *section_header =
  115. (struct kgsl_snapshot_section_header *)snapshot->ptr;
  116. u8 *buf = snapshot->ptr + sizeof(*section_header);
  117. struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
  118. u32 *data = (u32 *)(buf + sizeof(*header));
  119. u32 size = adreno_hwsched_parse_payload(payload, KEY_RB_SIZEDWORDS) << 2;
  120. u64 lo, hi, gpuaddr;
  121. void *rb_hostptr;
  122. char str[16];
  123. lo = adreno_hwsched_parse_payload(payload, KEY_RB_GPUADDR_LO);
  124. hi = adreno_hwsched_parse_payload(payload, KEY_RB_GPUADDR_HI);
  125. gpuaddr = hi << 32 | lo;
  126. /* Sanity check to make sure there is enough for the header */
  127. if (snapshot->remain < sizeof(*section_header))
  128. goto err;
  129. rb_hostptr = get_rb_hostptr(adreno_dev, gpuaddr, size);
  130. /* If the gpuaddress and size don't match any allocation, then abort */
  131. if (((snapshot->remain - sizeof(*section_header)) <
  132. (size + sizeof(*header))) ||
  133. !a6xx_copy_gpu_global(data, rb_hostptr, size))
  134. goto err;
  135. if (device->dump_all_ibs) {
  136. u64 rbaddr;
  137. kgsl_regread64(device, A6XX_CP_RB_BASE,
  138. A6XX_CP_RB_BASE_HI, &rbaddr);
  139. /* Parse all IBs from current RB */
  140. if (rbaddr == gpuaddr)
  141. adreno_snapshot_dump_all_ibs(device, rb_hostptr, snapshot);
  142. }
  143. header->start = 0;
  144. header->end = size >> 2;
  145. header->rptr = adreno_hwsched_parse_payload(payload, KEY_RB_RPTR);
  146. header->wptr = adreno_hwsched_parse_payload(payload, KEY_RB_WPTR);
  147. header->rbsize = size >> 2;
  148. header->count = size >> 2;
  149. header->timestamp_queued = adreno_hwsched_parse_payload(payload,
  150. KEY_RB_QUEUED_TS);
  151. header->timestamp_retired = adreno_hwsched_parse_payload(payload,
  152. KEY_RB_RETIRED_TS);
  153. header->gpuaddr = gpuaddr;
  154. header->id = adreno_hwsched_parse_payload(payload, KEY_RB_ID);
  155. section_header->magic = SNAPSHOT_SECTION_MAGIC;
  156. section_header->id = KGSL_SNAPSHOT_SECTION_RB_V2;
  157. section_header->size = size + sizeof(*header) + sizeof(*section_header);
  158. snapshot->ptr += section_header->size;
  159. snapshot->remain -= section_header->size;
  160. snapshot->size += section_header->size;
  161. return;
  162. err:
  163. snprintf(str, sizeof(str), "RB addr:0x%llx", gpuaddr);
  164. SNAPSHOT_ERR_NOMEM(device, str);
  165. }
  166. static bool parse_payload_rb_legacy(struct adreno_device *adreno_dev,
  167. struct kgsl_snapshot *snapshot)
  168. {
  169. struct hfi_context_bad_cmd_legacy *cmd = adreno_dev->hwsched.ctxt_bad;
  170. u32 i = 0, payload_bytes;
  171. void *start;
  172. bool ret = false;
  173. /* Skip if we didn't receive a context bad HFI */
  174. if (!cmd->hdr)
  175. return false;
  176. payload_bytes = (MSG_HDR_GET_SIZE(cmd->hdr) << 2) -
  177. offsetof(struct hfi_context_bad_cmd_legacy, payload);
  178. start = &cmd->payload[0];
  179. while (i < payload_bytes) {
  180. struct payload_section *payload = start + i;
  181. if (payload->type == PAYLOAD_RB) {
  182. adreno_hwsched_snapshot_rb_payload(adreno_dev, snapshot, payload);
  183. ret = true;
  184. }
  185. i += sizeof(*payload) + (payload->dwords << 2);
  186. }
  187. return ret;
  188. }
  189. static bool parse_payload_rb(struct adreno_device *adreno_dev,
  190. struct kgsl_snapshot *snapshot)
  191. {
  192. struct hfi_context_bad_cmd *cmd = adreno_dev->hwsched.ctxt_bad;
  193. u32 i = 0, payload_bytes;
  194. void *start;
  195. bool ret = false;
  196. /* Skip if we didn't receive a context bad HFI */
  197. if (!cmd->hdr)
  198. return false;
  199. payload_bytes = (MSG_HDR_GET_SIZE(cmd->hdr) << 2) -
  200. offsetof(struct hfi_context_bad_cmd, payload);
  201. start = &cmd->payload[0];
  202. while (i < payload_bytes) {
  203. struct payload_section *payload = start + i;
  204. if (payload->type == PAYLOAD_RB) {
  205. adreno_hwsched_snapshot_rb_payload(adreno_dev,
  206. snapshot, payload);
  207. ret = true;
  208. }
  209. i += sizeof(*payload) + (payload->dwords << 2);
  210. }
  211. return ret;
  212. }
  213. void a6xx_hwsched_snapshot(struct adreno_device *adreno_dev,
  214. struct kgsl_snapshot *snapshot)
  215. {
  216. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  217. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  218. struct a6xx_hwsched_hfi *hw_hfi = to_a6xx_hwsched_hfi(adreno_dev);
  219. u32 i;
  220. bool skip_memkind_rb = false;
  221. bool parse_payload;
  222. a6xx_gmu_snapshot(adreno_dev, snapshot);
  223. adreno_hwsched_parse_fault_cmdobj(adreno_dev, snapshot);
  224. /*
  225. * First try to dump ringbuffers using context bad HFI payloads
  226. * because they have all the ringbuffer parameters. If ringbuffer
  227. * payloads are not present, fall back to dumping ringbuffers
  228. * based on MEMKIND_RB
  229. */
  230. if (GMU_VER_MINOR(gmu->ver.hfi) < 2)
  231. parse_payload = parse_payload_rb_legacy(adreno_dev, snapshot);
  232. else
  233. parse_payload = parse_payload_rb(adreno_dev, snapshot);
  234. if (parse_payload)
  235. skip_memkind_rb = true;
  236. for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
  237. struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
  238. if (entry->desc.mem_kind == HFI_MEMKIND_RB && !skip_memkind_rb)
  239. kgsl_snapshot_add_section(device,
  240. KGSL_SNAPSHOT_SECTION_RB_V2,
  241. snapshot, adreno_hwsched_snapshot_rb,
  242. entry->md);
  243. if (entry->desc.mem_kind == HFI_MEMKIND_SCRATCH)
  244. kgsl_snapshot_add_section(device,
  245. KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
  246. snapshot, adreno_snapshot_global,
  247. entry->md);
  248. if (entry->desc.mem_kind == HFI_MEMKIND_PROFILE)
  249. kgsl_snapshot_add_section(device,
  250. KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
  251. snapshot, adreno_snapshot_global,
  252. entry->md);
  253. if (entry->desc.mem_kind == HFI_MEMKIND_CSW_SMMU_INFO)
  254. kgsl_snapshot_add_section(device,
  255. KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
  256. snapshot, adreno_snapshot_global,
  257. entry->md);
  258. if (entry->desc.mem_kind == HFI_MEMKIND_CSW_PRIV_NON_SECURE)
  259. snapshot_preemption_records(device, snapshot,
  260. entry->md);
  261. if (entry->desc.mem_kind == HFI_MEMKIND_PREEMPT_SCRATCH)
  262. kgsl_snapshot_add_section(device,
  263. KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
  264. snapshot, adreno_snapshot_global,
  265. entry->md);
  266. }
  267. }
  268. static int a6xx_hwsched_gmu_first_boot(struct adreno_device *adreno_dev)
  269. {
  270. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  271. struct kgsl_pwrctrl *pwr = &device->pwrctrl;
  272. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  273. int level, ret = 0;
  274. kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
  275. a6xx_gmu_aop_send_acd_state(gmu, adreno_dev->acd_enabled);
  276. ret = kgsl_pwrctrl_enable_cx_gdsc(device);
  277. if (ret)
  278. return ret;
  279. ret = a6xx_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
  280. if (ret)
  281. goto gdsc_off;
  282. ret = a6xx_gmu_load_fw(adreno_dev);
  283. if (ret)
  284. goto clks_gdsc_off;
  285. ret = a6xx_gmu_itcm_shadow(adreno_dev);
  286. if (ret)
  287. goto clks_gdsc_off;
  288. if (!test_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags)) {
  289. ret = a6xx_load_pdc_ucode(adreno_dev);
  290. if (ret)
  291. goto clks_gdsc_off;
  292. a6xx_load_rsc_ucode(adreno_dev);
  293. set_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags);
  294. }
  295. a6xx_gmu_register_config(adreno_dev);
  296. a6xx_gmu_version_info(adreno_dev);
  297. if (GMU_VER_MINOR(gmu->ver.hfi) < 2)
  298. set_bit(ADRENO_HWSCHED_CTX_BAD_LEGACY, &adreno_dev->hwsched.flags);
  299. a6xx_gmu_irq_enable(adreno_dev);
  300. /* Vote for minimal DDR BW for GMU to init */
  301. level = pwr->pwrlevels[pwr->default_pwrlevel].bus_min;
  302. icc_set_bw(pwr->icc_path, 0, kBps_to_icc(pwr->ddr_table[level]));
  303. /* Clear any hwsched faults that might have been left over */
  304. adreno_hwsched_clear_fault(adreno_dev);
  305. ret = a6xx_gmu_device_start(adreno_dev);
  306. if (ret)
  307. goto err;
  308. ret = a6xx_hwsched_hfi_start(adreno_dev);
  309. if (ret)
  310. goto err;
  311. icc_set_bw(pwr->icc_path, 0, 0);
  312. device->gmu_fault = false;
  313. kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
  314. return 0;
  315. err:
  316. a6xx_gmu_irq_disable(adreno_dev);
  317. if (device->gmu_fault) {
  318. a6xx_gmu_suspend(adreno_dev);
  319. return ret;
  320. }
  321. clks_gdsc_off:
  322. clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
  323. gdsc_off:
  324. a6xx_gmu_disable_gdsc(adreno_dev);
  325. a6xx_rdpm_cx_freq_update(gmu, 0);
  326. return ret;
  327. }
  328. static int a6xx_hwsched_gmu_boot(struct adreno_device *adreno_dev)
  329. {
  330. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  331. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  332. int ret = 0;
  333. kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
  334. ret = kgsl_pwrctrl_enable_cx_gdsc(device);
  335. if (ret)
  336. return ret;
  337. ret = a6xx_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
  338. if (ret)
  339. goto gdsc_off;
  340. ret = a6xx_rscc_wakeup_sequence(adreno_dev);
  341. if (ret)
  342. goto clks_gdsc_off;
  343. ret = a6xx_gmu_load_fw(adreno_dev);
  344. if (ret)
  345. goto clks_gdsc_off;
  346. a6xx_gmu_register_config(adreno_dev);
  347. a6xx_gmu_irq_enable(adreno_dev);
  348. /* Clear any hwsched faults that might have been left over */
  349. adreno_hwsched_clear_fault(adreno_dev);
  350. ret = a6xx_gmu_device_start(adreno_dev);
  351. if (ret)
  352. goto err;
  353. ret = a6xx_hwsched_hfi_start(adreno_dev);
  354. if (ret)
  355. goto err;
  356. device->gmu_fault = false;
  357. kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
  358. return 0;
  359. err:
  360. a6xx_gmu_irq_disable(adreno_dev);
  361. if (device->gmu_fault) {
  362. a6xx_gmu_suspend(adreno_dev);
  363. return ret;
  364. }
  365. clks_gdsc_off:
  366. clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
  367. gdsc_off:
  368. a6xx_gmu_disable_gdsc(adreno_dev);
  369. a6xx_rdpm_cx_freq_update(gmu, 0);
  370. return ret;
  371. }
  372. void a6xx_hwsched_active_count_put(struct adreno_device *adreno_dev)
  373. {
  374. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  375. if (WARN_ON(!mutex_is_locked(&device->mutex)))
  376. return;
  377. if (WARN(atomic_read(&device->active_cnt) == 0,
  378. "Unbalanced get/put calls to KGSL active count\n"))
  379. return;
  380. if (atomic_dec_and_test(&device->active_cnt)) {
  381. kgsl_pwrscale_update_stats(device);
  382. kgsl_pwrscale_update(device);
  383. kgsl_start_idle_timer(device);
  384. }
  385. trace_kgsl_active_count(device,
  386. (unsigned long) __builtin_return_address(0));
  387. wake_up(&device->active_cnt_wq);
  388. }
  389. static int a6xx_hwsched_notify_slumber(struct adreno_device *adreno_dev)
  390. {
  391. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  392. struct kgsl_pwrctrl *pwr = &device->pwrctrl;
  393. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  394. struct hfi_prep_slumber_cmd req;
  395. int ret;
  396. ret = CMD_MSG_HDR(req, H2F_MSG_PREPARE_SLUMBER);
  397. if (ret)
  398. return ret;
  399. req.freq = gmu->hfi.dcvs_table.gpu_level_num -
  400. pwr->default_pwrlevel - 1;
  401. req.bw = pwr->pwrlevels[pwr->default_pwrlevel].bus_freq;
  402. /* Disable the power counter so that the GMU is not busy */
  403. gmu_core_regwrite(device, A6XX_GMU_CX_GMU_POWER_COUNTER_ENABLE, 0);
  404. ret = a6xx_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
  405. /*
  406. * GEMNOC can enter power collapse state during GPU power down sequence.
  407. * This could abort CX GDSC collapse. Assert Qactive to avoid this.
  408. */
  409. if ((adreno_is_a662(adreno_dev) || adreno_is_a621(adreno_dev) ||
  410. adreno_is_a635(adreno_dev)))
  411. gmu_core_regwrite(device, A6XX_GPU_GMU_CX_GMU_CX_FALNEXT_INTF, 0x1);
  412. return ret;
  413. }
  414. static int a6xx_hwsched_gmu_power_off(struct adreno_device *adreno_dev)
  415. {
  416. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  417. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  418. int ret = 0;
  419. if (device->gmu_fault)
  420. goto error;
  421. /* Wait for the lowest idle level we requested */
  422. ret = a6xx_gmu_wait_for_lowest_idle(adreno_dev);
  423. if (ret)
  424. goto error;
  425. ret = a6xx_hwsched_notify_slumber(adreno_dev);
  426. if (ret)
  427. goto error;
  428. ret = a6xx_gmu_wait_for_idle(adreno_dev);
  429. if (ret)
  430. goto error;
  431. ret = a6xx_rscc_sleep_sequence(adreno_dev);
  432. a6xx_rdpm_mx_freq_update(gmu, 0);
  433. /* Now that we are done with GMU and GPU, Clear the GBIF */
  434. ret = a6xx_halt_gbif(adreno_dev);
  435. /* De-assert the halts */
  436. kgsl_regwrite(device, A6XX_GBIF_HALT, 0x0);
  437. a6xx_gmu_irq_disable(adreno_dev);
  438. a6xx_hwsched_hfi_stop(adreno_dev);
  439. clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
  440. a6xx_gmu_disable_gdsc(adreno_dev);
  441. a6xx_rdpm_cx_freq_update(gmu, 0);
  442. kgsl_pwrctrl_set_state(device, KGSL_STATE_NONE);
  443. return ret;
  444. error:
  445. a6xx_gmu_irq_disable(adreno_dev);
  446. a6xx_hwsched_hfi_stop(adreno_dev);
  447. a6xx_gmu_suspend(adreno_dev);
  448. return ret;
  449. }
  450. static int a6xx_hwsched_gpu_boot(struct adreno_device *adreno_dev)
  451. {
  452. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  453. int ret;
  454. ret = kgsl_mmu_start(device);
  455. if (ret)
  456. goto err;
  457. ret = a6xx_gmu_oob_set(device, oob_gpu);
  458. if (ret)
  459. goto err;
  460. /* Clear the busy_data stats - we're starting over from scratch */
  461. memset(&adreno_dev->busy_data, 0, sizeof(adreno_dev->busy_data));
  462. /* Restore performance counter registers with saved values */
  463. adreno_perfcounter_restore(adreno_dev);
  464. a6xx_start(adreno_dev);
  465. /* Re-initialize the coresight registers if applicable */
  466. adreno_coresight_start(adreno_dev);
  467. adreno_perfcounter_start(adreno_dev);
  468. /* Clear FSR here in case it is set from a previous pagefault */
  469. kgsl_mmu_clear_fsr(&device->mmu);
  470. a6xx_enable_gpu_irq(adreno_dev);
  471. ret = a6xx_hwsched_cp_init(adreno_dev);
  472. if (ret) {
  473. a6xx_disable_gpu_irq(adreno_dev);
  474. goto err;
  475. }
  476. /*
  477. * At this point it is safe to assume that we recovered. Setting
  478. * this field allows us to take a new snapshot for the next failure
  479. * if we are prioritizing the first unrecoverable snapshot.
  480. */
  481. if (device->snapshot)
  482. device->snapshot->recovered = true;
  483. device->reset_counter++;
  484. err:
  485. a6xx_gmu_oob_clear(device, oob_gpu);
  486. if (ret)
  487. a6xx_hwsched_gmu_power_off(adreno_dev);
  488. return ret;
  489. }
  490. static void hwsched_idle_timer(struct timer_list *t)
  491. {
  492. struct kgsl_device *device = container_of(t, struct kgsl_device,
  493. idle_timer);
  494. kgsl_schedule_work(&device->idle_check_ws);
  495. }
  496. static int a6xx_hwsched_gmu_memory_init(struct adreno_device *adreno_dev)
  497. {
  498. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  499. /* GMU Virtual register bank */
  500. if (IS_ERR_OR_NULL(gmu->vrb)) {
  501. gmu->vrb = reserve_gmu_kernel_block(gmu, 0, GMU_VRB_SIZE,
  502. GMU_NONCACHED_KERNEL, 0);
  503. if (IS_ERR(gmu->vrb))
  504. return PTR_ERR(gmu->vrb);
  505. /* Populate size of the virtual register bank */
  506. gmu_core_set_vrb_register(gmu->vrb->hostptr, VRB_SIZE_IDX,
  507. gmu->vrb->size >> 2);
  508. }
  509. /* GMU trace log */
  510. if (IS_ERR_OR_NULL(gmu->trace.md)) {
  511. gmu->trace.md = reserve_gmu_kernel_block(gmu, 0,
  512. GMU_TRACE_SIZE, GMU_NONCACHED_KERNEL, 0);
  513. if (IS_ERR(gmu->trace.md))
  514. return PTR_ERR(gmu->trace.md);
  515. /* Pass trace buffer address to GMU through the VRB */
  516. gmu_core_set_vrb_register(gmu->vrb->hostptr,
  517. VRB_TRACE_BUFFER_ADDR_IDX,
  518. gmu->trace.md->gmuaddr);
  519. /* Initialize the GMU trace buffer header */
  520. gmu_core_trace_header_init(&gmu->trace);
  521. }
  522. return 0;
  523. }
  524. static int a6xx_hwsched_gmu_init(struct adreno_device *adreno_dev)
  525. {
  526. int ret;
  527. ret = a6xx_gmu_parse_fw(adreno_dev);
  528. if (ret)
  529. return ret;
  530. ret = a6xx_gmu_memory_init(adreno_dev);
  531. if (ret)
  532. return ret;
  533. ret = a6xx_hwsched_gmu_memory_init(adreno_dev);
  534. if (ret)
  535. return ret;
  536. return a6xx_hwsched_hfi_init(adreno_dev);
  537. }
  538. static void a6xx_hwsched_touch_wakeup(struct adreno_device *adreno_dev)
  539. {
  540. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  541. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  542. int ret;
  543. /*
  544. * Do not wake up a suspended device or until the first boot sequence
  545. * has been completed.
  546. */
  547. if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags) ||
  548. !test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
  549. return;
  550. if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
  551. goto done;
  552. kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
  553. ret = a6xx_hwsched_gmu_boot(adreno_dev);
  554. if (ret)
  555. return;
  556. ret = a6xx_hwsched_gpu_boot(adreno_dev);
  557. if (ret)
  558. return;
  559. kgsl_pwrscale_wake(device);
  560. set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
  561. device->pwrctrl.last_stat_updated = ktime_get();
  562. kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
  563. done:
  564. /*
  565. * When waking up from a touch event we want to stay active long enough
  566. * for the user to send a draw command. The default idle timer timeout
  567. * is shorter than we want so go ahead and push the idle timer out
  568. * further for this special case
  569. */
  570. mod_timer(&device->idle_timer, jiffies +
  571. msecs_to_jiffies(adreno_wake_timeout));
  572. }
  573. static int a6xx_hwsched_boot(struct adreno_device *adreno_dev)
  574. {
  575. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  576. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  577. int ret;
  578. if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
  579. return 0;
  580. kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
  581. adreno_hwsched_start(adreno_dev);
  582. if (IS_ENABLED(CONFIG_QCOM_KGSL_HIBERNATION) &&
  583. !test_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags))
  584. ret = a6xx_hwsched_gmu_first_boot(adreno_dev);
  585. else
  586. ret = a6xx_hwsched_gmu_boot(adreno_dev);
  587. if (ret)
  588. return ret;
  589. ret = a6xx_hwsched_gpu_boot(adreno_dev);
  590. if (ret)
  591. return ret;
  592. kgsl_start_idle_timer(device);
  593. kgsl_pwrscale_wake(device);
  594. set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
  595. device->pwrctrl.last_stat_updated = ktime_get();
  596. kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
  597. return ret;
  598. }
  599. static int a6xx_hwsched_first_boot(struct adreno_device *adreno_dev)
  600. {
  601. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  602. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  603. int ret;
  604. if (test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
  605. return a6xx_hwsched_boot(adreno_dev);
  606. if (adreno_preemption_feature_set(adreno_dev))
  607. set_bit(ADRENO_DEVICE_PREEMPTION, &adreno_dev->priv);
  608. adreno_hwsched_start(adreno_dev);
  609. ret = a6xx_microcode_read(adreno_dev);
  610. if (ret)
  611. return ret;
  612. ret = a6xx_init(adreno_dev);
  613. if (ret)
  614. return ret;
  615. ret = a6xx_hwsched_gmu_init(adreno_dev);
  616. if (ret)
  617. return ret;
  618. kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
  619. ret = a6xx_hwsched_gmu_first_boot(adreno_dev);
  620. if (ret)
  621. return ret;
  622. ret = a6xx_hwsched_gpu_boot(adreno_dev);
  623. if (ret)
  624. return ret;
  625. adreno_get_bus_counters(adreno_dev);
  626. adreno_dev->cooperative_reset = ADRENO_FEATURE(adreno_dev,
  627. ADRENO_COOP_RESET);
  628. set_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags);
  629. set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
  630. /*
  631. * There is a possible deadlock scenario during kgsl firmware reading
  632. * (request_firmware) and devfreq update calls. During first boot, kgsl
  633. * device mutex is held and then request_firmware is called for reading
  634. * firmware. request_firmware internally takes dev_pm_qos_mtx lock.
  635. * Whereas in case of devfreq update calls triggered by thermal/bcl or
  636. * devfreq sysfs, it first takes the same dev_pm_qos_mtx lock and then
  637. * tries to take kgsl device mutex as part of get_dev_status/target
  638. * calls. This results in deadlock when both thread are unable to acquire
  639. * the mutex held by other thread. Enable devfreq updates now as we are
  640. * done reading all firmware files.
  641. */
  642. device->pwrscale.devfreq_enabled = true;
  643. device->pwrctrl.last_stat_updated = ktime_get();
  644. kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
  645. return 0;
  646. }
  647. static int a6xx_hwsched_power_off(struct adreno_device *adreno_dev)
  648. {
  649. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  650. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  651. int ret;
  652. if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
  653. return 0;
  654. kgsl_pwrctrl_request_state(device, KGSL_STATE_SLUMBER);
  655. ret = a6xx_gmu_oob_set(device, oob_gpu);
  656. if (ret) {
  657. a6xx_gmu_oob_clear(device, oob_gpu);
  658. goto no_gx_power;
  659. }
  660. kgsl_pwrscale_update_stats(device);
  661. /* Save active coresight registers if applicable */
  662. adreno_coresight_stop(adreno_dev);
  663. /* Save physical performance counter values before GPU power down*/
  664. adreno_perfcounter_save(adreno_dev);
  665. adreno_irqctrl(adreno_dev, 0);
  666. a6xx_gmu_oob_clear(device, oob_gpu);
  667. no_gx_power:
  668. kgsl_pwrctrl_irq(device, false);
  669. a6xx_hwsched_gmu_power_off(adreno_dev);
  670. adreno_hwsched_unregister_contexts(adreno_dev);
  671. adreno_llcc_slice_deactivate(adreno_dev);
  672. clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
  673. del_timer_sync(&device->idle_timer);
  674. kgsl_pwrscale_sleep(device);
  675. kgsl_pwrctrl_clear_l3_vote(device);
  676. kgsl_pwrctrl_set_state(device, KGSL_STATE_SLUMBER);
  677. return ret;
  678. }
  679. static void hwsched_idle_check(struct work_struct *work)
  680. {
  681. struct kgsl_device *device = container_of(work,
  682. struct kgsl_device, idle_check_ws);
  683. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  684. mutex_lock(&device->mutex);
  685. if (test_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags))
  686. goto done;
  687. if (atomic_read(&device->active_cnt) || time_is_after_jiffies(device->idle_jiffies)) {
  688. kgsl_pwrscale_update(device);
  689. kgsl_start_idle_timer(device);
  690. goto done;
  691. }
  692. spin_lock(&device->submit_lock);
  693. if (device->submit_now) {
  694. spin_unlock(&device->submit_lock);
  695. kgsl_pwrscale_update(device);
  696. kgsl_start_idle_timer(device);
  697. goto done;
  698. }
  699. device->skip_inline_submit = true;
  700. spin_unlock(&device->submit_lock);
  701. if (!a6xx_hw_isidle(adreno_dev)) {
  702. dev_err(device->dev, "GPU isn't idle before SLUMBER\n");
  703. gmu_core_fault_snapshot(device);
  704. }
  705. a6xx_hwsched_power_off(adreno_dev);
  706. done:
  707. mutex_unlock(&device->mutex);
  708. }
  709. static int a6xx_hwsched_first_open(struct adreno_device *adreno_dev)
  710. {
  711. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  712. int ret;
  713. /*
  714. * Do the one time settings that need to happen when we
  715. * attempt to boot the gpu the very first time
  716. */
  717. ret = a6xx_hwsched_first_boot(adreno_dev);
  718. if (ret)
  719. return ret;
  720. /*
  721. * A client that does a first_open but never closes the device
  722. * may prevent us from going back to SLUMBER. So trigger the idle
  723. * check by incrementing the active count and immediately releasing it.
  724. */
  725. atomic_inc(&device->active_cnt);
  726. a6xx_hwsched_active_count_put(adreno_dev);
  727. return 0;
  728. }
  729. int a6xx_hwsched_active_count_get(struct adreno_device *adreno_dev)
  730. {
  731. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  732. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  733. int ret = 0;
  734. if (WARN_ON(!mutex_is_locked(&device->mutex)))
  735. return -EINVAL;
  736. if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
  737. return -EINVAL;
  738. if ((atomic_read(&device->active_cnt) == 0))
  739. ret = a6xx_hwsched_boot(adreno_dev);
  740. if (ret == 0)
  741. atomic_inc(&device->active_cnt);
  742. trace_kgsl_active_count(device,
  743. (unsigned long) __builtin_return_address(0));
  744. return ret;
  745. }
  746. static int a6xx_hwsched_dcvs_set(struct adreno_device *adreno_dev,
  747. int gpu_pwrlevel, int bus_level)
  748. {
  749. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  750. struct kgsl_pwrctrl *pwr = &device->pwrctrl;
  751. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  752. struct hfi_dcvstable_cmd *table = &gmu->hfi.dcvs_table;
  753. struct hfi_gx_bw_perf_vote_cmd req = {
  754. .ack_type = DCVS_ACK_BLOCK,
  755. .freq = INVALID_DCVS_IDX,
  756. .bw = INVALID_DCVS_IDX,
  757. };
  758. int ret;
  759. if (!test_bit(GMU_PRIV_HFI_STARTED, &gmu->flags))
  760. return 0;
  761. /* Do not set to XO and lower GPU clock vote from GMU */
  762. if ((gpu_pwrlevel != INVALID_DCVS_IDX) &&
  763. (gpu_pwrlevel >= table->gpu_level_num - 1)) {
  764. dev_err(&gmu->pdev->dev, "Invalid gpu dcvs request: %d\n",
  765. gpu_pwrlevel);
  766. return -EINVAL;
  767. }
  768. if (gpu_pwrlevel < table->gpu_level_num - 1)
  769. req.freq = table->gpu_level_num - gpu_pwrlevel - 1;
  770. if (bus_level < pwr->ddr_table_count && bus_level > 0)
  771. req.bw = bus_level;
  772. /* GMU will vote for slumber levels through the sleep sequence */
  773. if ((req.freq == INVALID_DCVS_IDX) && (req.bw == INVALID_DCVS_IDX))
  774. return 0;
  775. ret = CMD_MSG_HDR(req, H2F_MSG_GX_BW_PERF_VOTE);
  776. if (ret)
  777. return ret;
  778. ret = a6xx_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
  779. if (ret) {
  780. dev_err_ratelimited(&gmu->pdev->dev,
  781. "Failed to set GPU perf idx %u, bw idx %u\n",
  782. req.freq, req.bw);
  783. /*
  784. * If this was a dcvs request along side an active gpu, request
  785. * dispatcher based reset and recovery.
  786. */
  787. if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
  788. adreno_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
  789. }
  790. if (req.freq != INVALID_DCVS_IDX)
  791. a6xx_rdpm_mx_freq_update(gmu,
  792. gmu->hfi.dcvs_table.gx_votes[req.freq].freq);
  793. return ret;
  794. }
  795. static int a6xx_hwsched_clock_set(struct adreno_device *adreno_dev,
  796. u32 pwrlevel)
  797. {
  798. return a6xx_hwsched_dcvs_set(adreno_dev, pwrlevel, INVALID_DCVS_IDX);
  799. }
  800. static void scale_gmu_frequency(struct adreno_device *adreno_dev, int buslevel)
  801. {
  802. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  803. struct kgsl_pwrctrl *pwr = &device->pwrctrl;
  804. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  805. static unsigned long prev_freq;
  806. unsigned long freq = gmu->freqs[0];
  807. if (!gmu->perf_ddr_bw)
  808. return;
  809. /*
  810. * Scale the GMU if DDR is at a CX corner at which GMU can run at
  811. * a higher frequency
  812. */
  813. if (pwr->ddr_table[buslevel] >= gmu->perf_ddr_bw)
  814. freq = gmu->freqs[GMU_MAX_PWRLEVELS - 1];
  815. if (prev_freq == freq)
  816. return;
  817. if (kgsl_clk_set_rate(gmu->clks, gmu->num_clks, "gmu_clk", freq)) {
  818. dev_err(&gmu->pdev->dev, "Unable to set the GMU clock to %ld\n",
  819. freq);
  820. return;
  821. }
  822. a6xx_rdpm_cx_freq_update(gmu, freq / 1000);
  823. trace_kgsl_gmu_pwrlevel(freq, prev_freq);
  824. prev_freq = freq;
  825. }
  826. static int a6xx_hwsched_bus_set(struct adreno_device *adreno_dev, int buslevel,
  827. u32 ab)
  828. {
  829. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  830. struct kgsl_pwrctrl *pwr = &device->pwrctrl;
  831. int ret = 0;
  832. kgsl_icc_set_tag(pwr, buslevel);
  833. if (buslevel != pwr->cur_buslevel) {
  834. ret = a6xx_hwsched_dcvs_set(adreno_dev, INVALID_DCVS_IDX,
  835. buslevel);
  836. if (ret)
  837. return ret;
  838. scale_gmu_frequency(adreno_dev, buslevel);
  839. pwr->cur_buslevel = buslevel;
  840. }
  841. if (ab != pwr->cur_ab) {
  842. icc_set_bw(pwr->icc_path, MBps_to_icc(ab), 0);
  843. pwr->cur_ab = ab;
  844. }
  845. trace_kgsl_buslevel(device, pwr->active_pwrlevel, pwr->cur_buslevel, pwr->cur_ab);
  846. return ret;
  847. }
  848. static int a6xx_hwsched_pm_suspend(struct adreno_device *adreno_dev)
  849. {
  850. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  851. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  852. int ret;
  853. if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
  854. return 0;
  855. kgsl_pwrctrl_request_state(device, KGSL_STATE_SUSPEND);
  856. /* Halt any new submissions */
  857. reinit_completion(&device->halt_gate);
  858. /**
  859. * Wait for the dispatcher to retire everything by waiting
  860. * for the active count to go to zero.
  861. */
  862. ret = kgsl_active_count_wait(device, 0, msecs_to_jiffies(100));
  863. if (ret) {
  864. dev_err(device->dev, "Timed out waiting for the active count\n");
  865. goto err;
  866. }
  867. ret = adreno_hwsched_idle(adreno_dev);
  868. if (ret)
  869. goto err;
  870. a6xx_hwsched_power_off(adreno_dev);
  871. adreno_get_gpu_halt(adreno_dev);
  872. set_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
  873. kgsl_pwrctrl_set_state(device, KGSL_STATE_SUSPEND);
  874. return 0;
  875. err:
  876. adreno_hwsched_start(adreno_dev);
  877. return ret;
  878. }
  879. void a6xx_hwsched_handle_watchdog(struct adreno_device *adreno_dev)
  880. {
  881. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  882. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  883. u32 mask;
  884. /* Temporarily mask the watchdog interrupt to prevent a storm */
  885. gmu_core_regread(device, A6XX_GMU_AO_HOST_INTERRUPT_MASK,
  886. &mask);
  887. gmu_core_regwrite(device, A6XX_GMU_AO_HOST_INTERRUPT_MASK,
  888. (mask | GMU_INT_WDOG_BITE));
  889. a6xx_gmu_send_nmi(device, false);
  890. dev_err_ratelimited(&gmu->pdev->dev,
  891. "GMU watchdog expired interrupt received\n");
  892. adreno_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
  893. }
  894. static void a6xx_hwsched_pm_resume(struct adreno_device *adreno_dev)
  895. {
  896. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  897. if (WARN(!test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags),
  898. "resume invoked without a suspend\n"))
  899. return;
  900. adreno_put_gpu_halt(adreno_dev);
  901. adreno_hwsched_start(adreno_dev);
  902. clear_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
  903. }
  904. static void a6xx_hwsched_drain_ctxt_unregister(struct adreno_device *adreno_dev)
  905. {
  906. struct a6xx_hwsched_hfi *hfi = to_a6xx_hwsched_hfi(adreno_dev);
  907. struct pending_cmd *cmd = NULL;
  908. read_lock(&hfi->msglock);
  909. list_for_each_entry(cmd, &hfi->msglist, node) {
  910. if (MSG_HDR_GET_ID(cmd->sent_hdr) == H2F_MSG_UNREGISTER_CONTEXT)
  911. complete(&cmd->complete);
  912. }
  913. read_unlock(&hfi->msglock);
  914. }
  915. int a6xx_hwsched_reset_replay(struct adreno_device *adreno_dev)
  916. {
  917. struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
  918. int ret;
  919. /*
  920. * Any pending context unregister packets will be lost
  921. * since we hard reset the GMU. This means any threads waiting
  922. * for context unregister hfi ack will timeout. Wake them
  923. * to avoid false positive ack timeout messages later.
  924. */
  925. a6xx_hwsched_drain_ctxt_unregister(adreno_dev);
  926. adreno_hwsched_unregister_contexts(adreno_dev);
  927. if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
  928. return 0;
  929. a6xx_disable_gpu_irq(adreno_dev);
  930. a6xx_gmu_irq_disable(adreno_dev);
  931. a6xx_hwsched_hfi_stop(adreno_dev);
  932. a6xx_gmu_suspend(adreno_dev);
  933. adreno_llcc_slice_deactivate(adreno_dev);
  934. clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
  935. ret = a6xx_hwsched_boot(adreno_dev);
  936. if (!ret)
  937. adreno_hwsched_replay(adreno_dev);
  938. BUG_ON(ret);
  939. return ret;
  940. }
  941. const struct adreno_power_ops a6xx_hwsched_power_ops = {
  942. .first_open = a6xx_hwsched_first_open,
  943. .last_close = a6xx_hwsched_power_off,
  944. .active_count_get = a6xx_hwsched_active_count_get,
  945. .active_count_put = a6xx_hwsched_active_count_put,
  946. .touch_wakeup = a6xx_hwsched_touch_wakeup,
  947. .pm_suspend = a6xx_hwsched_pm_suspend,
  948. .pm_resume = a6xx_hwsched_pm_resume,
  949. .gpu_clock_set = a6xx_hwsched_clock_set,
  950. .gpu_bus_set = a6xx_hwsched_bus_set,
  951. };
  952. const struct adreno_hwsched_ops a6xx_hwsched_ops = {
  953. .submit_drawobj = a6xx_hwsched_submit_drawobj,
  954. .preempt_count = a6xx_hwsched_preempt_count_get,
  955. };
  956. int a6xx_hwsched_probe(struct platform_device *pdev,
  957. u32 chipid, const struct adreno_gpu_core *gpucore)
  958. {
  959. struct adreno_device *adreno_dev;
  960. struct kgsl_device *device;
  961. struct a6xx_hwsched_device *a6xx_hwsched_dev;
  962. int ret;
  963. a6xx_hwsched_dev = devm_kzalloc(&pdev->dev, sizeof(*a6xx_hwsched_dev),
  964. GFP_KERNEL);
  965. if (!a6xx_hwsched_dev)
  966. return -ENOMEM;
  967. adreno_dev = &a6xx_hwsched_dev->a6xx_dev.adreno_dev;
  968. adreno_dev->hwsched_enabled = true;
  969. adreno_dev->irq_mask = A6XX_HWSCHED_INT_MASK;
  970. ret = a6xx_probe_common(pdev, adreno_dev, chipid, gpucore);
  971. if (ret)
  972. return ret;
  973. device = KGSL_DEVICE(adreno_dev);
  974. INIT_WORK(&device->idle_check_ws, hwsched_idle_check);
  975. timer_setup(&device->idle_timer, hwsched_idle_timer, 0);
  976. return adreno_hwsched_init(adreno_dev, &a6xx_hwsched_ops);
  977. }
  978. int a6xx_hwsched_add_to_minidump(struct adreno_device *adreno_dev)
  979. {
  980. struct a6xx_device *a6xx_dev = container_of(adreno_dev,
  981. struct a6xx_device, adreno_dev);
  982. struct a6xx_hwsched_device *a6xx_hwsched = container_of(a6xx_dev,
  983. struct a6xx_hwsched_device, a6xx_dev);
  984. struct a6xx_hwsched_hfi *hw_hfi = &a6xx_hwsched->hwsched_hfi;
  985. int ret, i;
  986. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev, KGSL_HWSCHED_DEVICE,
  987. (void *)(a6xx_hwsched), sizeof(struct a6xx_hwsched_device));
  988. if (ret)
  989. return ret;
  990. if (!IS_ERR_OR_NULL(a6xx_dev->gmu.gmu_log)) {
  991. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  992. KGSL_GMU_LOG_ENTRY,
  993. a6xx_dev->gmu.gmu_log->hostptr,
  994. a6xx_dev->gmu.gmu_log->size);
  995. if (ret)
  996. return ret;
  997. }
  998. if (!IS_ERR_OR_NULL(a6xx_dev->gmu.hfi.hfi_mem)) {
  999. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1000. KGSL_HFIMEM_ENTRY,
  1001. a6xx_dev->gmu.hfi.hfi_mem->hostptr,
  1002. a6xx_dev->gmu.hfi.hfi_mem->size);
  1003. if (ret)
  1004. return ret;
  1005. }
  1006. if (!IS_ERR_OR_NULL(a6xx_dev->gmu.vrb)) {
  1007. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1008. KGSL_GMU_VRB_ENTRY,
  1009. a6xx_dev->gmu.vrb->hostptr,
  1010. a6xx_dev->gmu.vrb->size);
  1011. if (ret)
  1012. return ret;
  1013. }
  1014. if (!IS_ERR_OR_NULL(a6xx_dev->gmu.dump_mem)) {
  1015. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1016. KGSL_GMU_DUMPMEM_ENTRY,
  1017. a6xx_dev->gmu.dump_mem->hostptr,
  1018. a6xx_dev->gmu.dump_mem->size);
  1019. if (ret)
  1020. return ret;
  1021. }
  1022. if (!IS_ERR_OR_NULL(a6xx_dev->gmu.trace.md)) {
  1023. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1024. KGSL_GMU_TRACE_ENTRY,
  1025. a6xx_dev->gmu.trace.md->hostptr,
  1026. a6xx_dev->gmu.trace.md->size);
  1027. if (ret)
  1028. return ret;
  1029. }
  1030. /* Dump HFI hwsched global mem alloc entries */
  1031. for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
  1032. struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
  1033. char hfi_minidump_str[MAX_VA_MINIDUMP_STR_LEN] = {0};
  1034. u32 rb_id = 0;
  1035. if (!hfi_get_minidump_string(entry->desc.mem_kind,
  1036. &hfi_minidump_str[0],
  1037. sizeof(hfi_minidump_str), &rb_id)) {
  1038. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1039. hfi_minidump_str,
  1040. entry->md->hostptr,
  1041. entry->md->size);
  1042. if (ret)
  1043. return ret;
  1044. }
  1045. }
  1046. if (!IS_ERR_OR_NULL(hw_hfi->big_ib)) {
  1047. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1048. KGSL_HFI_BIG_IB_ENTRY,
  1049. hw_hfi->big_ib->hostptr,
  1050. hw_hfi->big_ib->size);
  1051. if (ret)
  1052. return ret;
  1053. }
  1054. if (!IS_ERR_OR_NULL(hw_hfi->big_ib_recurring))
  1055. ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
  1056. KGSL_HFI_BIG_IB_REC_ENTRY,
  1057. hw_hfi->big_ib_recurring->hostptr,
  1058. hw_hfi->big_ib_recurring->size);
  1059. return ret;
  1060. }