adreno_gen7.c 67 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (c) 2021, The Linux Foundation. All rights reserved.
  4. * Copyright (c) 2022-2024 Qualcomm Innovation Center, Inc. All rights reserved.
  5. */
  6. #include <linux/debugfs.h>
  7. #include <linux/io.h>
  8. #include <linux/of.h>
  9. #include <linux/of_fdt.h>
  10. #include <linux/of_device.h>
  11. #include <linux/regulator/consumer.h>
  12. #include <linux/soc/qcom/llcc-qcom.h>
  13. #include <soc/qcom/of_common.h>
  14. #include "adreno.h"
  15. #include "adreno_gen7.h"
  16. #include "adreno_gen7_hwsched.h"
  17. #include "adreno_pm4types.h"
  18. #include "adreno_trace.h"
  19. #include "kgsl_pwrscale.h"
  20. #include "kgsl_trace.h"
  21. #include "kgsl_util.h"
  22. /* IFPC & Preemption static powerup restore list */
  23. static const u32 gen7_pwrup_reglist[] = {
  24. GEN7_UCHE_TRAP_BASE_LO,
  25. GEN7_UCHE_TRAP_BASE_HI,
  26. GEN7_UCHE_WRITE_THRU_BASE_LO,
  27. GEN7_UCHE_WRITE_THRU_BASE_HI,
  28. GEN7_UCHE_GMEM_RANGE_MIN_LO,
  29. GEN7_UCHE_GMEM_RANGE_MIN_HI,
  30. GEN7_UCHE_GMEM_RANGE_MAX_LO,
  31. GEN7_UCHE_GMEM_RANGE_MAX_HI,
  32. GEN7_UCHE_CACHE_WAYS,
  33. GEN7_UCHE_MODE_CNTL,
  34. GEN7_RB_NC_MODE_CNTL,
  35. GEN7_RB_CMP_DBG_ECO_CNTL,
  36. GEN7_GRAS_NC_MODE_CNTL,
  37. GEN7_RB_CONTEXT_SWITCH_GMEM_SAVE_RESTORE,
  38. GEN7_UCHE_GBIF_GX_CONFIG,
  39. GEN7_UCHE_CLIENT_PF,
  40. GEN7_TPL1_DBG_ECO_CNTL1,
  41. };
  42. static const u32 gen7_0_0_pwrup_reglist[] = {
  43. GEN7_UCHE_TRAP_BASE_LO,
  44. GEN7_UCHE_TRAP_BASE_HI,
  45. GEN7_UCHE_WRITE_THRU_BASE_LO,
  46. GEN7_UCHE_WRITE_THRU_BASE_HI,
  47. GEN7_UCHE_GMEM_RANGE_MIN_LO,
  48. GEN7_UCHE_GMEM_RANGE_MIN_HI,
  49. GEN7_UCHE_GMEM_RANGE_MAX_LO,
  50. GEN7_UCHE_GMEM_RANGE_MAX_HI,
  51. GEN7_UCHE_CACHE_WAYS,
  52. GEN7_UCHE_MODE_CNTL,
  53. GEN7_RB_NC_MODE_CNTL,
  54. GEN7_RB_CMP_DBG_ECO_CNTL,
  55. GEN7_SP_NC_MODE_CNTL,
  56. GEN7_GRAS_NC_MODE_CNTL,
  57. GEN7_RB_CONTEXT_SWITCH_GMEM_SAVE_RESTORE,
  58. GEN7_UCHE_GBIF_GX_CONFIG,
  59. GEN7_UCHE_CLIENT_PF,
  60. };
  61. /* IFPC only static powerup restore list */
  62. static const u32 gen7_ifpc_pwrup_reglist[] = {
  63. GEN7_TPL1_NC_MODE_CNTL,
  64. GEN7_SP_NC_MODE_CNTL,
  65. GEN7_CP_DBG_ECO_CNTL,
  66. GEN7_CP_PROTECT_CNTL,
  67. GEN7_CP_LPAC_PROTECT_CNTL,
  68. GEN7_CP_PROTECT_REG,
  69. GEN7_CP_PROTECT_REG+1,
  70. GEN7_CP_PROTECT_REG+2,
  71. GEN7_CP_PROTECT_REG+3,
  72. GEN7_CP_PROTECT_REG+4,
  73. GEN7_CP_PROTECT_REG+5,
  74. GEN7_CP_PROTECT_REG+6,
  75. GEN7_CP_PROTECT_REG+7,
  76. GEN7_CP_PROTECT_REG+8,
  77. GEN7_CP_PROTECT_REG+9,
  78. GEN7_CP_PROTECT_REG+10,
  79. GEN7_CP_PROTECT_REG+11,
  80. GEN7_CP_PROTECT_REG+12,
  81. GEN7_CP_PROTECT_REG+13,
  82. GEN7_CP_PROTECT_REG+14,
  83. GEN7_CP_PROTECT_REG+15,
  84. GEN7_CP_PROTECT_REG+16,
  85. GEN7_CP_PROTECT_REG+17,
  86. GEN7_CP_PROTECT_REG+18,
  87. GEN7_CP_PROTECT_REG+19,
  88. GEN7_CP_PROTECT_REG+20,
  89. GEN7_CP_PROTECT_REG+21,
  90. GEN7_CP_PROTECT_REG+22,
  91. GEN7_CP_PROTECT_REG+23,
  92. GEN7_CP_PROTECT_REG+24,
  93. GEN7_CP_PROTECT_REG+25,
  94. GEN7_CP_PROTECT_REG+26,
  95. GEN7_CP_PROTECT_REG+27,
  96. GEN7_CP_PROTECT_REG+28,
  97. GEN7_CP_PROTECT_REG+29,
  98. GEN7_CP_PROTECT_REG+30,
  99. GEN7_CP_PROTECT_REG+31,
  100. GEN7_CP_PROTECT_REG+32,
  101. GEN7_CP_PROTECT_REG+33,
  102. GEN7_CP_PROTECT_REG+34,
  103. GEN7_CP_PROTECT_REG+35,
  104. GEN7_CP_PROTECT_REG+36,
  105. GEN7_CP_PROTECT_REG+37,
  106. GEN7_CP_PROTECT_REG+38,
  107. GEN7_CP_PROTECT_REG+39,
  108. GEN7_CP_PROTECT_REG+40,
  109. GEN7_CP_PROTECT_REG+41,
  110. GEN7_CP_PROTECT_REG+42,
  111. GEN7_CP_PROTECT_REG+43,
  112. GEN7_CP_PROTECT_REG+44,
  113. GEN7_CP_PROTECT_REG+45,
  114. GEN7_CP_PROTECT_REG+46,
  115. GEN7_CP_PROTECT_REG+47,
  116. GEN7_CP_AHB_CNTL,
  117. };
  118. static const u32 gen7_0_0_ifpc_pwrup_reglist[] = {
  119. GEN7_TPL1_NC_MODE_CNTL,
  120. GEN7_CP_DBG_ECO_CNTL,
  121. GEN7_CP_PROTECT_CNTL,
  122. GEN7_CP_LPAC_PROTECT_CNTL,
  123. GEN7_CP_PROTECT_REG,
  124. GEN7_CP_PROTECT_REG+1,
  125. GEN7_CP_PROTECT_REG+2,
  126. GEN7_CP_PROTECT_REG+3,
  127. GEN7_CP_PROTECT_REG+4,
  128. GEN7_CP_PROTECT_REG+5,
  129. GEN7_CP_PROTECT_REG+6,
  130. GEN7_CP_PROTECT_REG+7,
  131. GEN7_CP_PROTECT_REG+8,
  132. GEN7_CP_PROTECT_REG+9,
  133. GEN7_CP_PROTECT_REG+10,
  134. GEN7_CP_PROTECT_REG+11,
  135. GEN7_CP_PROTECT_REG+12,
  136. GEN7_CP_PROTECT_REG+13,
  137. GEN7_CP_PROTECT_REG+14,
  138. GEN7_CP_PROTECT_REG+15,
  139. GEN7_CP_PROTECT_REG+16,
  140. GEN7_CP_PROTECT_REG+17,
  141. GEN7_CP_PROTECT_REG+18,
  142. GEN7_CP_PROTECT_REG+19,
  143. GEN7_CP_PROTECT_REG+20,
  144. GEN7_CP_PROTECT_REG+21,
  145. GEN7_CP_PROTECT_REG+22,
  146. GEN7_CP_PROTECT_REG+23,
  147. GEN7_CP_PROTECT_REG+24,
  148. GEN7_CP_PROTECT_REG+25,
  149. GEN7_CP_PROTECT_REG+26,
  150. GEN7_CP_PROTECT_REG+27,
  151. GEN7_CP_PROTECT_REG+28,
  152. GEN7_CP_PROTECT_REG+29,
  153. GEN7_CP_PROTECT_REG+30,
  154. GEN7_CP_PROTECT_REG+31,
  155. GEN7_CP_PROTECT_REG+32,
  156. GEN7_CP_PROTECT_REG+33,
  157. GEN7_CP_PROTECT_REG+34,
  158. GEN7_CP_PROTECT_REG+35,
  159. GEN7_CP_PROTECT_REG+36,
  160. GEN7_CP_PROTECT_REG+37,
  161. GEN7_CP_PROTECT_REG+38,
  162. GEN7_CP_PROTECT_REG+39,
  163. GEN7_CP_PROTECT_REG+40,
  164. GEN7_CP_PROTECT_REG+41,
  165. GEN7_CP_PROTECT_REG+42,
  166. GEN7_CP_PROTECT_REG+43,
  167. GEN7_CP_PROTECT_REG+44,
  168. GEN7_CP_PROTECT_REG+45,
  169. GEN7_CP_PROTECT_REG+46,
  170. GEN7_CP_PROTECT_REG+47,
  171. GEN7_CP_AHB_CNTL,
  172. };
  173. /* Gen7_9_x IFPC only static powerup restore list */
  174. static const u32 gen7_9_x_ifpc_pwrup_reglist[] = {
  175. GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_1,
  176. GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_2,
  177. GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_3,
  178. GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_4,
  179. };
  180. static int acd_calibrate_set(void *data, u64 val)
  181. {
  182. struct kgsl_device *device = data;
  183. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  184. struct gen7_gmu_device *gmu = to_gen7_gmu(adreno_dev);
  185. u32 debug_val = (u32) val;
  186. int ret;
  187. mutex_lock(&device->mutex);
  188. ret = adreno_active_count_get(adreno_dev);
  189. if (ret)
  190. goto err;
  191. ret = gen7_hfi_send_set_value(adreno_dev, HFI_VALUE_DBG, F_PWR_ACD_CALIBRATE, debug_val);
  192. if (!ret)
  193. gmu->acd_debug_val = debug_val;
  194. adreno_active_count_put(adreno_dev);
  195. err:
  196. mutex_unlock(&device->mutex);
  197. return ret;
  198. }
  199. static int acd_calibrate_get(void *data, u64 *val)
  200. {
  201. struct kgsl_device *device = data;
  202. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  203. struct gen7_gmu_device *gmu = to_gen7_gmu(adreno_dev);
  204. *val = (u64) gmu->acd_debug_val;
  205. return 0;
  206. }
  207. DEFINE_DEBUGFS_ATTRIBUTE(acd_cal_fops, acd_calibrate_get, acd_calibrate_set, "%llu\n");
  208. void gen7_cp_init_cmds(struct adreno_device *adreno_dev, u32 *cmds)
  209. {
  210. u32 i = 0, mask = 0;
  211. /* Disable concurrent binning before sending CP init */
  212. cmds[i++] = cp_type7_packet(CP_THREAD_CONTROL, 1);
  213. cmds[i++] = BIT(27);
  214. /* Use multiple HW contexts */
  215. mask |= BIT(0);
  216. /* Enable error detection */
  217. mask |= BIT(1);
  218. /* Set default reset state */
  219. mask |= BIT(3);
  220. /* Disable save/restore of performance counters across preemption */
  221. mask |= BIT(6);
  222. /* Enable the register init list with the spinlock */
  223. mask |= BIT(8);
  224. /* By default DMS is enabled from CP side, disable it if not supported */
  225. if (!adreno_dev->dms_enabled)
  226. mask |= BIT(11);
  227. cmds[i++] = cp_type7_packet(CP_ME_INIT, 7);
  228. /* Enabled ordinal mask */
  229. cmds[i++] = mask;
  230. cmds[i++] = 0x00000003; /* Set number of HW contexts */
  231. cmds[i++] = 0x20000000; /* Enable error detection */
  232. cmds[i++] = 0x00000002; /* Operation mode mask */
  233. /* Register initialization list with spinlock */
  234. cmds[i++] = lower_32_bits(adreno_dev->pwrup_reglist->gpuaddr);
  235. cmds[i++] = upper_32_bits(adreno_dev->pwrup_reglist->gpuaddr);
  236. /*
  237. * Gen7 targets with concurrent binning are expected to have a dynamic
  238. * power up list with triplets which contains the pipe id in it.
  239. * Bit 31 of POWER_UP_REGISTER_LIST_LENGTH is reused here to let CP
  240. * know if the power up contains the triplets. If
  241. * REGISTER_INIT_LIST_WITH_SPINLOCK is set and bit 31 below is set,
  242. * CP expects a dynamic list with triplets.
  243. */
  244. cmds[i++] = BIT(31);
  245. }
  246. int gen7_fenced_write(struct adreno_device *adreno_dev, u32 offset,
  247. u32 value, u32 mask)
  248. {
  249. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  250. const struct adreno_gpudev *gpudev = ADRENO_GPU_DEVICE(adreno_dev);
  251. unsigned int status, i;
  252. u64 ts1, ts2;
  253. kgsl_regwrite(device, offset, value);
  254. ts1 = gpudev->read_alwayson(adreno_dev);
  255. for (i = 0; i < GMU_CORE_LONG_WAKEUP_RETRY_LIMIT; i++) {
  256. /*
  257. * Make sure the previous register write is posted before
  258. * checking the fence status
  259. */
  260. mb();
  261. gmu_core_regread(device, GEN7_GMU_AHB_FENCE_STATUS, &status);
  262. /*
  263. * If !writedropped0/1, then the write to fenced register
  264. * was successful
  265. */
  266. if (!(status & mask))
  267. break;
  268. /* Wait a small amount of time before trying again */
  269. udelay(GMU_CORE_WAKEUP_DELAY_US);
  270. /* Try to write the fenced register again */
  271. kgsl_regwrite(device, offset, value);
  272. }
  273. if (i < GMU_CORE_SHORT_WAKEUP_RETRY_LIMIT)
  274. return 0;
  275. if (i == GMU_CORE_LONG_WAKEUP_RETRY_LIMIT) {
  276. ts2 = gpudev->read_alwayson(adreno_dev);
  277. dev_err(device->dev,
  278. "Timed out waiting %d usecs to write fenced register 0x%x, timestamps: %llx %llx\n",
  279. i * GMU_CORE_WAKEUP_DELAY_US, offset, ts1, ts2);
  280. return -ETIMEDOUT;
  281. }
  282. dev_info(device->dev,
  283. "Waited %d usecs to write fenced register 0x%x\n",
  284. i * GMU_CORE_WAKEUP_DELAY_US, offset);
  285. return 0;
  286. }
  287. int gen7_init(struct adreno_device *adreno_dev)
  288. {
  289. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  290. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  291. u64 freq = gen7_core->gmu_hub_clk_freq;
  292. adreno_dev->highest_bank_bit = gen7_core->highest_bank_bit;
  293. adreno_dev->gmu_hub_clk_freq = freq ? freq : 150000000;
  294. adreno_dev->ahb_timeout_val = adreno_get_ahb_timeout_val(adreno_dev,
  295. gen7_core->noc_timeout_us);
  296. adreno_dev->bcl_data = gen7_core->bcl_data;
  297. adreno_dev->cooperative_reset = ADRENO_FEATURE(adreno_dev,
  298. ADRENO_COOP_RESET);
  299. /* If the memory type is DDR 4, override the existing configuration */
  300. if (of_fdt_get_ddrtype() == 0x7)
  301. adreno_dev->highest_bank_bit = 14;
  302. gen7_crashdump_init(adreno_dev);
  303. return adreno_allocate_global(device, &adreno_dev->pwrup_reglist,
  304. PAGE_SIZE, 0, 0, KGSL_MEMDESC_PRIVILEGED,
  305. "powerup_register_list");
  306. }
  307. #define CX_TIMER_INIT_SAMPLES 16
  308. void gen7_cx_timer_init(struct adreno_device *adreno_dev)
  309. {
  310. u64 seed_val, tmr, skew = 0;
  311. int i;
  312. unsigned long flags;
  313. /*
  314. * Only gen7_9_x has the CX timer. Set it up during first boot or
  315. * after suspend resume.
  316. */
  317. if (!adreno_is_gen7_9_x(adreno_dev) ||
  318. test_bit(ADRENO_DEVICE_CX_TIMER_INITIALIZED, &adreno_dev->priv))
  319. return;
  320. /* Disable irqs to get accurate timings */
  321. local_irq_save(flags);
  322. /* Calculate the overhead of timer reads and register writes */
  323. for (i = 0; i < CX_TIMER_INIT_SAMPLES; i++) {
  324. u64 tmr1, tmr2, tmr3;
  325. /* Measure time for two reads of the CPU timer */
  326. tmr1 = arch_timer_read_counter();
  327. tmr2 = arch_timer_read_counter();
  328. /* Write to the register and time it */
  329. adreno_cx_misc_regwrite(adreno_dev,
  330. GEN7_GPU_CX_MISC_AO_COUNTER_LO,
  331. lower_32_bits(tmr2));
  332. adreno_cx_misc_regwrite(adreno_dev,
  333. GEN7_GPU_CX_MISC_AO_COUNTER_HI,
  334. upper_32_bits(tmr2));
  335. /* Barrier to make sure the write completes before timing it */
  336. mb();
  337. tmr3 = arch_timer_read_counter();
  338. /* Calculate difference between register write and CPU timer */
  339. skew += (tmr3 - tmr2) - (tmr2 - tmr1);
  340. }
  341. local_irq_restore(flags);
  342. /* Get the average over all our readings, to the closest integer */
  343. skew = (skew + CX_TIMER_INIT_SAMPLES / 2) / CX_TIMER_INIT_SAMPLES;
  344. local_irq_save(flags);
  345. tmr = arch_timer_read_counter();
  346. seed_val = tmr + skew;
  347. /* Seed the GPU CX counter with the adjusted timer */
  348. adreno_cx_misc_regwrite(adreno_dev,
  349. GEN7_GPU_CX_MISC_AO_COUNTER_LO, lower_32_bits(seed_val));
  350. adreno_cx_misc_regwrite(adreno_dev,
  351. GEN7_GPU_CX_MISC_AO_COUNTER_HI, upper_32_bits(seed_val));
  352. local_irq_restore(flags);
  353. set_bit(ADRENO_DEVICE_CX_TIMER_INITIALIZED, &adreno_dev->priv);
  354. }
  355. void gen7_get_gpu_feature_info(struct adreno_device *adreno_dev)
  356. {
  357. u32 feature_fuse = 0;
  358. /* Only Gen7_9_x has the HW feature information */
  359. if (!adreno_is_gen7_9_x(adreno_dev))
  360. return;
  361. /* Get HW feature soft fuse value */
  362. adreno_cx_misc_regread(adreno_dev, GEN7_GPU_CX_MISC_SW_FUSE_VALUE,
  363. &feature_fuse);
  364. adreno_dev->fastblend_enabled = feature_fuse & BIT(GEN7_FASTBLEND_SW_FUSE);
  365. adreno_dev->raytracing_enabled = feature_fuse & BIT(GEN7_RAYTRACING_SW_FUSE);
  366. /* If software enables LPAC without HW support, disable it */
  367. if (ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  368. adreno_dev->lpac_enabled = feature_fuse & BIT(GEN7_LPAC_SW_FUSE);
  369. adreno_dev->feature_fuse = feature_fuse;
  370. }
  371. #define GEN7_PROTECT_DEFAULT (BIT(0) | BIT(1) | BIT(3))
  372. static void gen7_protect_init(struct adreno_device *adreno_dev)
  373. {
  374. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  375. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  376. const struct gen7_protected_regs *regs = gen7_core->protected_regs;
  377. int i;
  378. /*
  379. * Enable access protection to privileged registers, fault on an access
  380. * protect violation and select the last span to protect from the start
  381. * address all the way to the end of the register address space
  382. */
  383. kgsl_regwrite(device, GEN7_CP_PROTECT_CNTL, GEN7_PROTECT_DEFAULT);
  384. if (adreno_dev->lpac_enabled)
  385. kgsl_regwrite(device, GEN7_CP_LPAC_PROTECT_CNTL, GEN7_PROTECT_DEFAULT);
  386. /* Program each register defined by the core definition */
  387. for (i = 0; regs[i].reg; i++) {
  388. u32 count;
  389. /*
  390. * This is the offset of the end register as counted from the
  391. * start, i.e. # of registers in the range - 1
  392. */
  393. count = regs[i].end - regs[i].start;
  394. kgsl_regwrite(device, regs[i].reg,
  395. FIELD_PREP(GENMASK(17, 0), regs[i].start) |
  396. FIELD_PREP(GENMASK(30, 18), count) |
  397. FIELD_PREP(BIT(31), regs[i].noaccess));
  398. }
  399. }
  400. #define RBBM_CLOCK_CNTL_ON 0x8aa8aa82
  401. static void gen7_hwcg_set(struct adreno_device *adreno_dev, bool on)
  402. {
  403. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  404. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  405. unsigned int value;
  406. int i;
  407. if (!adreno_dev->hwcg_enabled)
  408. on = false;
  409. for (i = 0; i < gen7_core->ao_hwcg_count; i++)
  410. gmu_core_regwrite(device, gen7_core->ao_hwcg[i].offset,
  411. on ? gen7_core->ao_hwcg[i].val : 0);
  412. if (!gen7_core->hwcg) {
  413. kgsl_regwrite(device, GEN7_RBBM_CLOCK_CNTL_GLOBAL, 1);
  414. kgsl_regwrite(device, GEN7_RBBM_CGC_GLOBAL_LOAD_CMD, on ? 1 : 0);
  415. if (on) {
  416. u32 retry = 3;
  417. kgsl_regwrite(device, GEN7_RBBM_CGC_P2S_TRIG_CMD, 1);
  418. /* Poll for the TXDONE:BIT(0) status */
  419. do {
  420. /* Wait for small amount of time for TXDONE status*/
  421. udelay(1);
  422. kgsl_regread(device, GEN7_RBBM_CGC_P2S_STATUS, &value);
  423. } while (!(value & BIT(0)) && --retry);
  424. if (!(value & BIT(0))) {
  425. dev_err(device->dev, "RBBM_CGC_P2S_STATUS:TXDONE Poll failed\n");
  426. kgsl_device_snapshot(device, NULL, NULL, false);
  427. return;
  428. }
  429. kgsl_regwrite(device, GEN7_RBBM_CLOCK_CNTL_GLOBAL, 0);
  430. }
  431. return;
  432. }
  433. kgsl_regread(device, GEN7_RBBM_CLOCK_CNTL, &value);
  434. if (value == RBBM_CLOCK_CNTL_ON && on)
  435. return;
  436. if (value == 0 && !on)
  437. return;
  438. for (i = 0; i < gen7_core->hwcg_count; i++)
  439. kgsl_regwrite(device, gen7_core->hwcg[i].offset,
  440. on ? gen7_core->hwcg[i].val : 0);
  441. /* enable top level HWCG */
  442. kgsl_regwrite(device, GEN7_RBBM_CLOCK_CNTL,
  443. on ? RBBM_CLOCK_CNTL_ON : 0);
  444. }
  445. static void gen7_patch_pwrup_reglist(struct adreno_device *adreno_dev)
  446. {
  447. struct adreno_reglist_list reglist[3];
  448. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  449. struct cpu_gpu_lock *lock = ptr;
  450. u32 items = 0, i, j;
  451. u32 *dest = ptr + sizeof(*lock);
  452. /* Static IFPC-only registers */
  453. if (adreno_is_gen7_0_x_family(adreno_dev)) {
  454. reglist[items].regs = gen7_0_0_ifpc_pwrup_reglist;
  455. reglist[items].count = ARRAY_SIZE(gen7_0_0_ifpc_pwrup_reglist);
  456. } else {
  457. reglist[items].regs = gen7_ifpc_pwrup_reglist;
  458. reglist[items].count = ARRAY_SIZE(gen7_ifpc_pwrup_reglist);
  459. }
  460. lock->ifpc_list_len = reglist[items].count;
  461. items++;
  462. if (adreno_is_gen7_9_x(adreno_dev)) {
  463. reglist[items].regs = gen7_9_x_ifpc_pwrup_reglist;
  464. reglist[items].count = ARRAY_SIZE(gen7_9_x_ifpc_pwrup_reglist);
  465. lock->ifpc_list_len += reglist[items].count;
  466. items++;
  467. }
  468. /* Static IFPC + preemption registers */
  469. if (adreno_is_gen7_0_x_family(adreno_dev)) {
  470. reglist[items].regs = gen7_0_0_pwrup_reglist;
  471. reglist[items].count = ARRAY_SIZE(gen7_0_0_pwrup_reglist);
  472. } else {
  473. reglist[items].regs = gen7_pwrup_reglist;
  474. reglist[items].count = ARRAY_SIZE(gen7_pwrup_reglist);
  475. }
  476. lock->preemption_list_len = reglist[items].count;
  477. items++;
  478. /*
  479. * For each entry in each of the lists, write the offset and the current
  480. * register value into the GPU buffer
  481. */
  482. for (i = 0; i < items; i++) {
  483. const u32 *r = reglist[i].regs;
  484. for (j = 0; j < reglist[i].count; j++) {
  485. *dest++ = r[j];
  486. kgsl_regread(KGSL_DEVICE(adreno_dev), r[j], dest++);
  487. }
  488. }
  489. /*
  490. * The overall register list is composed of
  491. * 1. Static IFPC-only registers
  492. * 2. Static IFPC + preemption registers
  493. * 3. Dynamic IFPC + preemption registers (ex: perfcounter selects)
  494. *
  495. * The first two lists are static. Size of these lists are stored as
  496. * number of pairs in ifpc_list_len and preemption_list_len
  497. * respectively. With concurrent binning, Some of the perfcounter
  498. * registers being virtualized, CP needs to know the pipe id to program
  499. * the aperture inorder to restore the same. Thus, third list is a
  500. * dynamic list with triplets as
  501. * (<aperture, shifted 12 bits> <address> <data>), and the length is
  502. * stored as number for triplets in dynamic_list_len.
  503. */
  504. lock->dynamic_list_len = 0;
  505. }
  506. /* _llc_configure_gpu_scid() - Program the sub-cache ID for all GPU blocks */
  507. static void _llc_configure_gpu_scid(struct adreno_device *adreno_dev)
  508. {
  509. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  510. u32 gpu_scid;
  511. if (IS_ERR_OR_NULL(adreno_dev->gpu_llc_slice) ||
  512. !adreno_dev->gpu_llc_slice_enable)
  513. return;
  514. if (llcc_slice_activate(adreno_dev->gpu_llc_slice))
  515. return;
  516. gpu_scid = llcc_get_slice_id(adreno_dev->gpu_llc_slice);
  517. /* 6 blocks at 5 bits per block */
  518. kgsl_regwrite(device, GEN7_GBIF_SCACHE_CNTL1,
  519. FIELD_PREP(GENMASK(29, 25), gpu_scid) |
  520. FIELD_PREP(GENMASK(24, 20), gpu_scid) |
  521. FIELD_PREP(GENMASK(19, 15), gpu_scid) |
  522. FIELD_PREP(GENMASK(14, 10), gpu_scid) |
  523. FIELD_PREP(GENMASK(9, 5), gpu_scid) |
  524. FIELD_PREP(GENMASK(4, 0), gpu_scid));
  525. kgsl_regwrite(device, GEN7_GBIF_SCACHE_CNTL0,
  526. FIELD_PREP(GENMASK(14, 10), gpu_scid) | BIT(8));
  527. }
  528. static void _llc_gpuhtw_slice_activate(struct adreno_device *adreno_dev)
  529. {
  530. if (IS_ERR_OR_NULL(adreno_dev->gpuhtw_llc_slice) ||
  531. !adreno_dev->gpuhtw_llc_slice_enable)
  532. return;
  533. llcc_slice_activate(adreno_dev->gpuhtw_llc_slice);
  534. }
  535. static void _set_secvid(struct kgsl_device *device)
  536. {
  537. kgsl_regwrite(device, GEN7_RBBM_SECVID_TSB_CNTL, 0x0);
  538. kgsl_regwrite(device, GEN7_RBBM_SECVID_TSB_TRUSTED_BASE_LO,
  539. lower_32_bits(KGSL_IOMMU_SECURE_BASE32));
  540. kgsl_regwrite(device, GEN7_RBBM_SECVID_TSB_TRUSTED_BASE_HI,
  541. upper_32_bits(KGSL_IOMMU_SECURE_BASE32));
  542. kgsl_regwrite(device, GEN7_RBBM_SECVID_TSB_TRUSTED_SIZE,
  543. FIELD_PREP(GENMASK(31, 12),
  544. (KGSL_IOMMU_SECURE_SIZE(&device->mmu) / SZ_4K)));
  545. }
  546. /* Set UCHE_TRAP_BASE to a page below the top of the memory space */
  547. #define GEN7_UCHE_TRAP_BASE 0x1FFFFFFFFF000ULL
  548. static u64 gen7_get_uche_trap_base(void)
  549. {
  550. return GEN7_UCHE_TRAP_BASE;
  551. }
  552. /*
  553. * All Gen7 targets support marking certain transactions as always privileged
  554. * which allows us to mark more memory as privileged without having to
  555. * explicitly set the APRIV bit. Choose the following transactions to be
  556. * privileged by default:
  557. * CDWRITE [6:6] - Crashdumper writes
  558. * CDREAD [5:5] - Crashdumper reads
  559. * RBRPWB [3:3] - RPTR shadow writes
  560. * RBPRIVLEVEL [2:2] - Memory accesses from PM4 packets in the ringbuffer
  561. * RBFETCH [1:1] - Ringbuffer reads
  562. * ICACHE [0:0] - Instruction cache fetches
  563. */
  564. #define GEN7_APRIV_DEFAULT (BIT(3) | BIT(2) | BIT(1) | BIT(0))
  565. /* Add crashdumper permissions for the BR APRIV */
  566. #define GEN7_BR_APRIV_DEFAULT (GEN7_APRIV_DEFAULT | BIT(6) | BIT(5))
  567. void gen7_enable_ahb_timeout_detection(struct adreno_device *adreno_dev)
  568. {
  569. u32 val;
  570. if (!adreno_dev->ahb_timeout_val)
  571. return;
  572. val = (ADRENO_AHB_CNTL_DEFAULT | FIELD_PREP(GENMASK(4, 0),
  573. adreno_dev->ahb_timeout_val));
  574. adreno_cx_misc_regwrite(adreno_dev, GEN7_GPU_CX_MISC_CX_AHB_AON_CNTL, val);
  575. adreno_cx_misc_regwrite(adreno_dev, GEN7_GPU_CX_MISC_CX_AHB_GMU_CNTL, val);
  576. adreno_cx_misc_regwrite(adreno_dev, GEN7_GPU_CX_MISC_CX_AHB_CP_CNTL, val);
  577. adreno_cx_misc_regwrite(adreno_dev, GEN7_GPU_CX_MISC_CX_AHB_VBIF_SMMU_CNTL, val);
  578. adreno_cx_misc_regwrite(adreno_dev, GEN7_GPU_CX_MISC_CX_AHB_HOST_CNTL, val);
  579. }
  580. int gen7_start(struct adreno_device *adreno_dev)
  581. {
  582. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  583. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  584. u32 mal, mode = 0, rgb565_predicator = 0;
  585. /*
  586. * HBB values 13 to 16 can represented LSB of HBB from 0 to 3.
  587. * Any HBB value beyond 16 needs programming MSB of HBB.
  588. * By default highest bank bit is 14, Hence set default HBB LSB
  589. * to "1" and MSB to "0".
  590. */
  591. u32 hbb_lo = 1, hbb_hi = 0;
  592. struct cpu_gpu_lock *pwrup_lock = adreno_dev->pwrup_reglist->hostptr;
  593. u64 uche_trap_base = gen7_get_uche_trap_base();
  594. /* Set up GBIF registers from the GPU core definition */
  595. kgsl_regmap_multi_write(&device->regmap, gen7_core->gbif,
  596. gen7_core->gbif_count);
  597. kgsl_regwrite(device, GEN7_UCHE_GBIF_GX_CONFIG, 0x10240e0);
  598. /* Make all blocks contribute to the GPU BUSY perf counter */
  599. kgsl_regwrite(device, GEN7_RBBM_PERFCTR_GPU_BUSY_MASKED, 0xffffffff);
  600. /*
  601. * Set UCHE_WRITE_THRU_BASE to the UCHE_TRAP_BASE effectively
  602. * disabling L2 bypass
  603. */
  604. kgsl_regwrite(device, GEN7_UCHE_TRAP_BASE_LO, lower_32_bits(uche_trap_base));
  605. kgsl_regwrite(device, GEN7_UCHE_TRAP_BASE_HI, upper_32_bits(uche_trap_base));
  606. kgsl_regwrite(device, GEN7_UCHE_WRITE_THRU_BASE_LO, lower_32_bits(uche_trap_base));
  607. kgsl_regwrite(device, GEN7_UCHE_WRITE_THRU_BASE_HI, upper_32_bits(uche_trap_base));
  608. /*
  609. * Some gen7 targets don't use a programmed UCHE GMEM base address,
  610. * so skip programming the register for such targets.
  611. */
  612. if (adreno_dev->uche_gmem_base) {
  613. kgsl_regwrite(device, GEN7_UCHE_GMEM_RANGE_MIN_LO,
  614. adreno_dev->uche_gmem_base);
  615. kgsl_regwrite(device, GEN7_UCHE_GMEM_RANGE_MIN_HI, 0x0);
  616. kgsl_regwrite(device, GEN7_UCHE_GMEM_RANGE_MAX_LO,
  617. adreno_dev->uche_gmem_base +
  618. adreno_dev->gpucore->gmem_size - 1);
  619. kgsl_regwrite(device, GEN7_UCHE_GMEM_RANGE_MAX_HI, 0x0);
  620. }
  621. kgsl_regwrite(device, GEN7_UCHE_CACHE_WAYS, 0x800000);
  622. /*
  623. * Disable LPAC hard sync event to fix lock up issue when BR/BV event
  624. * fifo is full.
  625. */
  626. if (adreno_dev->lpac_enabled)
  627. kgsl_regrmw(device, GEN7_UCHE_DBG_CNTL_1, BIT(30), BIT(30));
  628. kgsl_regwrite(device, GEN7_UCHE_CMDQ_CONFIG,
  629. FIELD_PREP(GENMASK(19, 16), 6) |
  630. FIELD_PREP(GENMASK(15, 12), 6) |
  631. FIELD_PREP(GENMASK(11, 8), 9) |
  632. BIT(3) | BIT(2) |
  633. FIELD_PREP(GENMASK(1, 0), 2));
  634. /*
  635. * CP takes care of the restore during IFPC exit. We need to restore at slumber
  636. * boundary as well
  637. */
  638. if (pwrup_lock->dynamic_list_len > 0)
  639. kgsl_regwrite(device, GEN7_RBBM_PERFCTR_CNTL, 0x1);
  640. /* Turn on the IFPC counter (countable 4 on XOCLK4) */
  641. kgsl_regwrite(device, GEN7_GMU_CX_GMU_POWER_COUNTER_SELECT_1,
  642. FIELD_PREP(GENMASK(7, 0), 0x4));
  643. /* Turn on counter to count total time spent in BCL throttle */
  644. if (adreno_dev->bcl_enabled && adreno_is_gen7_2_x_family(adreno_dev))
  645. kgsl_regrmw(device, GEN7_GMU_CX_GMU_POWER_COUNTER_SELECT_1, GENMASK(15, 8),
  646. FIELD_PREP(GENMASK(15, 8), 0x26));
  647. if (of_property_read_u32(device->pdev->dev.of_node,
  648. "qcom,min-access-length", &mal))
  649. mal = 32;
  650. of_property_read_u32(device->pdev->dev.of_node,
  651. "qcom,ubwc-mode", &mode);
  652. if (!WARN_ON(!adreno_dev->highest_bank_bit)) {
  653. hbb_lo = (adreno_dev->highest_bank_bit - 13) & 3;
  654. hbb_hi = ((adreno_dev->highest_bank_bit - 13) >> 2) & 1;
  655. }
  656. if (mode == KGSL_UBWC_4_0)
  657. rgb565_predicator = 1;
  658. kgsl_regwrite(device, GEN7_RB_NC_MODE_CNTL,
  659. ((rgb565_predicator == 1) ? BIT(11) : 0) |
  660. ((hbb_hi == 1) ? BIT(10) : 0) |
  661. BIT(4) | /*AMSBC is enabled on UBWC 3.0 and 4.0 */
  662. ((mal == 64) ? BIT(3) : 0) |
  663. FIELD_PREP(GENMASK(2, 1), hbb_lo));
  664. kgsl_regwrite(device, GEN7_TPL1_NC_MODE_CNTL,
  665. ((hbb_hi == 1) ? BIT(4) : 0) |
  666. ((mal == 64) ? BIT(3) : 0) |
  667. FIELD_PREP(GENMASK(2, 1), hbb_lo));
  668. /* Configure TP bicubic registers */
  669. if (adreno_is_gen7_9_x(adreno_dev)) {
  670. kgsl_regwrite(device, GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_1, 0x3fe05ff4);
  671. kgsl_regwrite(device, GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_2, 0x3fa0ebee);
  672. kgsl_regwrite(device, GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_3, 0x3f5193ed);
  673. kgsl_regwrite(device, GEN7_TPL1_BICUBIC_WEIGHTS_TABLE_4, 0x3f0243f0);
  674. }
  675. kgsl_regwrite(device, GEN7_SP_NC_MODE_CNTL,
  676. FIELD_PREP(GENMASK(11, 10), hbb_hi) |
  677. FIELD_PREP(GENMASK(5, 4), 2) |
  678. ((mal == 64) ? BIT(3) : 0) |
  679. FIELD_PREP(GENMASK(2, 1), hbb_lo));
  680. kgsl_regwrite(device, GEN7_GRAS_NC_MODE_CNTL,
  681. FIELD_PREP(GENMASK(8, 5),
  682. (adreno_dev->highest_bank_bit - 13)));
  683. kgsl_regwrite(device, GEN7_UCHE_MODE_CNTL,
  684. ((mal == 64) ? BIT(23) : 0) |
  685. FIELD_PREP(GENMASK(22, 21), hbb_lo));
  686. kgsl_regwrite(device, GEN7_RBBM_INTERFACE_HANG_INT_CNTL, BIT(30) |
  687. FIELD_PREP(GENMASK(27, 0),
  688. gen7_core->hang_detect_cycles));
  689. kgsl_regwrite(device, GEN7_UCHE_CLIENT_PF, BIT(7) |
  690. FIELD_PREP(GENMASK(3, 0), adreno_dev->uche_client_pf));
  691. /* Enable the GMEM save/restore feature for preemption */
  692. if (adreno_is_preemption_enabled(adreno_dev))
  693. kgsl_regwrite(device, GEN7_RB_CONTEXT_SWITCH_GMEM_SAVE_RESTORE,
  694. 0x1);
  695. if (adreno_is_gen7_9_x(adreno_dev)) {
  696. /* Disable ubwc merged UFC request feature */
  697. kgsl_regrmw(device, GEN7_RB_CMP_DBG_ECO_CNTL, BIT(19), BIT(19));
  698. /* Enable TP flaghint and other performance settings */
  699. kgsl_regwrite(device, GEN7_TPL1_DBG_ECO_CNTL1, 0xc0700);
  700. } else {
  701. /* Disable non-ubwc read reqs from passing write reqs */
  702. kgsl_regrmw(device, GEN7_RB_CMP_DBG_ECO_CNTL, BIT(11), BIT(11));
  703. }
  704. /* Enable GMU power counter 0 to count GPU busy */
  705. kgsl_regwrite(device, GEN7_GPU_GMU_AO_GPU_CX_BUSY_MASK, 0xff000000);
  706. kgsl_regrmw(device, GEN7_GMU_CX_GMU_POWER_COUNTER_SELECT_0,
  707. 0xFF, 0x20);
  708. kgsl_regwrite(device, GEN7_GMU_CX_GMU_POWER_COUNTER_ENABLE, 0x1);
  709. gen7_protect_init(adreno_dev);
  710. /* Configure LLCC */
  711. _llc_configure_gpu_scid(adreno_dev);
  712. _llc_gpuhtw_slice_activate(adreno_dev);
  713. kgsl_regwrite(device, GEN7_CP_APRIV_CNTL, GEN7_BR_APRIV_DEFAULT);
  714. kgsl_regwrite(device, GEN7_CP_BV_APRIV_CNTL, GEN7_APRIV_DEFAULT);
  715. kgsl_regwrite(device, GEN7_CP_LPAC_APRIV_CNTL, GEN7_APRIV_DEFAULT);
  716. /* Marking AQE Instruction cache fetches as privileged */
  717. if (ADRENO_FEATURE(adreno_dev, ADRENO_AQE))
  718. kgsl_regwrite(device, GEN7_CP_AQE_APRIV_CNTL, BIT(0));
  719. if (adreno_is_gen7_9_x(adreno_dev))
  720. kgsl_regrmw(device, GEN7_GBIF_CX_CONFIG, GENMASK(31, 29),
  721. FIELD_PREP(GENMASK(31, 29), 1));
  722. /*
  723. * CP Icache prefetch brings no benefit on few gen7 variants because of
  724. * the prefetch granularity size.
  725. */
  726. if (adreno_is_gen7_0_0(adreno_dev) || adreno_is_gen7_0_1(adreno_dev) ||
  727. adreno_is_gen7_4_0(adreno_dev) || adreno_is_gen7_2_0(adreno_dev)
  728. || adreno_is_gen7_2_1(adreno_dev) || adreno_is_gen7_11_0(adreno_dev)) {
  729. kgsl_regwrite(device, GEN7_CP_CHICKEN_DBG, 0x1);
  730. kgsl_regwrite(device, GEN7_CP_BV_CHICKEN_DBG, 0x1);
  731. kgsl_regwrite(device, GEN7_CP_LPAC_CHICKEN_DBG, 0x1);
  732. }
  733. _set_secvid(device);
  734. /*
  735. * Enable hardware clock gating here to prevent any register access
  736. * issue due to internal clock gating.
  737. */
  738. gen7_hwcg_set(adreno_dev, true);
  739. /*
  740. * All registers must be written before this point so that we don't
  741. * miss any register programming when we patch the power up register
  742. * list.
  743. */
  744. if (!adreno_dev->patch_reglist &&
  745. (adreno_dev->pwrup_reglist->gpuaddr != 0)) {
  746. gen7_patch_pwrup_reglist(adreno_dev);
  747. adreno_dev->patch_reglist = true;
  748. }
  749. return 0;
  750. }
  751. /* Offsets into the MX/CX mapped register regions */
  752. #define GEN7_RDPM_MX_OFFSET 0xf00
  753. #define GEN7_RDPM_CX_OFFSET 0xf14
  754. void gen7_rdpm_mx_freq_update(struct gen7_gmu_device *gmu, u32 freq)
  755. {
  756. if (gmu->rdpm_mx_virt) {
  757. writel_relaxed(freq/1000, (gmu->rdpm_mx_virt + GEN7_RDPM_MX_OFFSET));
  758. /*
  759. * ensure previous writes post before this one,
  760. * i.e. act like normal writel()
  761. */
  762. wmb();
  763. }
  764. }
  765. void gen7_rdpm_cx_freq_update(struct gen7_gmu_device *gmu, u32 freq)
  766. {
  767. if (gmu->rdpm_cx_virt) {
  768. writel_relaxed(freq/1000, (gmu->rdpm_cx_virt + GEN7_RDPM_CX_OFFSET));
  769. /*
  770. * ensure previous writes post before this one,
  771. * i.e. act like normal writel()
  772. */
  773. wmb();
  774. }
  775. }
  776. int gen7_scm_gpu_init_cx_regs(struct adreno_device *adreno_dev)
  777. {
  778. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  779. u32 gpu_req = GPU_ALWAYS_EN_REQ;
  780. int ret;
  781. if (ADRENO_FEATURE(adreno_dev, ADRENO_BCL))
  782. gpu_req |= GPU_BCL_EN_REQ;
  783. if (ADRENO_FEATURE(adreno_dev, ADRENO_CLX))
  784. gpu_req |= GPU_CLX_EN_REQ;
  785. if (adreno_is_gen7_9_x(adreno_dev))
  786. gpu_req |= GPU_TSENSE_EN_REQ;
  787. ret = kgsl_scm_gpu_init_regs(&device->pdev->dev, gpu_req);
  788. /*
  789. * For targets that support this scm call to program BCL id , enable BCL.
  790. * For other targets, BCL is enabled after first GMU boot.
  791. */
  792. if (!ret && ADRENO_FEATURE(adreno_dev, ADRENO_BCL))
  793. adreno_dev->bcl_enabled = true;
  794. /* If programming TZ CLX was successful, then program KMD owned CLX regs */
  795. if (!ret && ADRENO_FEATURE(adreno_dev, ADRENO_CLX))
  796. adreno_dev->clx_enabled = true;
  797. /*
  798. * If scm call returned EOPNOTSUPP, either we are on a kernel version
  799. * lesser than 6.1 where scm call is not supported or we are sending an
  800. * empty request. Ignore the error in such cases.
  801. */
  802. return (ret == -EOPNOTSUPP) ? 0 : ret;
  803. }
  804. void gen7_spin_idle_debug(struct adreno_device *adreno_dev,
  805. const char *str)
  806. {
  807. struct kgsl_device *device = &adreno_dev->dev;
  808. unsigned int rptr, wptr;
  809. unsigned int status, status3, intstatus;
  810. unsigned int hwfault;
  811. dev_err(device->dev, str);
  812. kgsl_regread(device, GEN7_CP_RB_RPTR, &rptr);
  813. kgsl_regread(device, GEN7_CP_RB_WPTR, &wptr);
  814. kgsl_regread(device, GEN7_RBBM_STATUS, &status);
  815. kgsl_regread(device, GEN7_RBBM_STATUS3, &status3);
  816. kgsl_regread(device, GEN7_RBBM_INT_0_STATUS, &intstatus);
  817. kgsl_regread(device, GEN7_CP_HW_FAULT, &hwfault);
  818. dev_err(device->dev,
  819. "rb=%d pos=%X/%X rbbm_status=%8.8X/%8.8X int_0_status=%8.8X\n",
  820. adreno_dev->cur_rb ? adreno_dev->cur_rb->id : -1, rptr, wptr,
  821. status, status3, intstatus);
  822. dev_err(device->dev, " hwfault=%8.8X\n", hwfault);
  823. kgsl_device_snapshot(device, NULL, NULL, false);
  824. }
  825. /*
  826. * gen7_send_cp_init() - Initialize ringbuffer
  827. * @adreno_dev: Pointer to adreno device
  828. * @rb: Pointer to the ringbuffer of device
  829. *
  830. * Submit commands for ME initialization,
  831. */
  832. static int gen7_send_cp_init(struct adreno_device *adreno_dev,
  833. struct adreno_ringbuffer *rb)
  834. {
  835. unsigned int *cmds;
  836. int ret;
  837. cmds = adreno_ringbuffer_allocspace(rb, GEN7_CP_INIT_DWORDS);
  838. if (IS_ERR(cmds))
  839. return PTR_ERR(cmds);
  840. gen7_cp_init_cmds(adreno_dev, cmds);
  841. ret = gen7_ringbuffer_submit(rb, NULL);
  842. if (!ret) {
  843. ret = adreno_spin_idle(adreno_dev, 2000);
  844. if (ret) {
  845. gen7_spin_idle_debug(adreno_dev,
  846. "CP initialization failed to idle\n");
  847. rb->wptr = 0;
  848. rb->_wptr = 0;
  849. }
  850. }
  851. return ret;
  852. }
  853. static int gen7_post_start(struct adreno_device *adreno_dev)
  854. {
  855. int ret;
  856. unsigned int *cmds;
  857. struct adreno_ringbuffer *rb = adreno_dev->cur_rb;
  858. struct adreno_preemption *preempt = &adreno_dev->preempt;
  859. u64 kmd_postamble_addr;
  860. if (!adreno_is_preemption_enabled(adreno_dev))
  861. return 0;
  862. kmd_postamble_addr = SCRATCH_POSTAMBLE_ADDR(KGSL_DEVICE(adreno_dev));
  863. gen7_preemption_prepare_postamble(adreno_dev);
  864. cmds = adreno_ringbuffer_allocspace(rb, (preempt->postamble_bootup_len ? 16 : 12));
  865. if (IS_ERR(cmds))
  866. return PTR_ERR(cmds);
  867. *cmds++ = cp_type7_packet(CP_SET_PSEUDO_REGISTER, 6);
  868. *cmds++ = SET_PSEUDO_PRIV_NON_SECURE_SAVE_ADDR;
  869. *cmds++ = lower_32_bits(rb->preemption_desc->gpuaddr);
  870. *cmds++ = upper_32_bits(rb->preemption_desc->gpuaddr);
  871. *cmds++ = SET_PSEUDO_PRIV_SECURE_SAVE_ADDR;
  872. *cmds++ = lower_32_bits(rb->secure_preemption_desc->gpuaddr);
  873. *cmds++ = upper_32_bits(rb->secure_preemption_desc->gpuaddr);
  874. if (preempt->postamble_bootup_len) {
  875. *cmds++ = cp_type7_packet(CP_SET_AMBLE, 3);
  876. *cmds++ = lower_32_bits(kmd_postamble_addr);
  877. *cmds++ = upper_32_bits(kmd_postamble_addr);
  878. *cmds++ = FIELD_PREP(GENMASK(22, 20), CP_KMD_AMBLE_TYPE)
  879. | (FIELD_PREP(GENMASK(19, 0), adreno_dev->preempt.postamble_bootup_len));
  880. }
  881. *cmds++ = cp_type7_packet(CP_CONTEXT_SWITCH_YIELD, 4);
  882. *cmds++ = 0;
  883. *cmds++ = 0;
  884. *cmds++ = 0;
  885. /* generate interrupt on preemption completion */
  886. *cmds++ = 0;
  887. ret = gen7_ringbuffer_submit(rb, NULL);
  888. if (!ret) {
  889. ret = adreno_spin_idle(adreno_dev, 2000);
  890. if (ret)
  891. gen7_spin_idle_debug(adreno_dev,
  892. "hw preemption initialization failed to idle\n");
  893. }
  894. return ret;
  895. }
  896. int gen7_rb_start(struct adreno_device *adreno_dev)
  897. {
  898. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  899. struct adreno_firmware *fw = ADRENO_FW(adreno_dev, ADRENO_FW_SQE);
  900. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  901. struct adreno_ringbuffer *rb;
  902. u64 addr;
  903. int ret, i;
  904. unsigned int *cmds;
  905. /* Clear all the ringbuffers */
  906. FOR_EACH_RINGBUFFER(adreno_dev, rb, i) {
  907. memset(rb->buffer_desc->hostptr, 0xaa, KGSL_RB_SIZE);
  908. kgsl_sharedmem_writel(device->scratch,
  909. SCRATCH_RB_OFFSET(rb->id, rptr), 0);
  910. kgsl_sharedmem_writel(device->scratch,
  911. SCRATCH_RB_OFFSET(rb->id, bv_rptr), 0);
  912. rb->wptr = 0;
  913. rb->_wptr = 0;
  914. rb->wptr_preempt_end = UINT_MAX;
  915. }
  916. gen7_preemption_start(adreno_dev);
  917. /* Set up the current ringbuffer */
  918. rb = ADRENO_CURRENT_RINGBUFFER(adreno_dev);
  919. addr = SCRATCH_RB_GPU_ADDR(device, rb->id, rptr);
  920. kgsl_regwrite(device, GEN7_CP_RB_RPTR_ADDR_LO, lower_32_bits(addr));
  921. kgsl_regwrite(device, GEN7_CP_RB_RPTR_ADDR_HI, upper_32_bits(addr));
  922. addr = SCRATCH_RB_GPU_ADDR(device, rb->id, bv_rptr);
  923. kgsl_regwrite(device, GEN7_CP_BV_RB_RPTR_ADDR_LO, lower_32_bits(addr));
  924. kgsl_regwrite(device, GEN7_CP_BV_RB_RPTR_ADDR_HI, upper_32_bits(addr));
  925. kgsl_regwrite(device, GEN7_CP_RB_CNTL, GEN7_CP_RB_CNTL_DEFAULT);
  926. kgsl_regwrite(device, GEN7_CP_RB_BASE,
  927. lower_32_bits(rb->buffer_desc->gpuaddr));
  928. kgsl_regwrite(device, GEN7_CP_RB_BASE_HI,
  929. upper_32_bits(rb->buffer_desc->gpuaddr));
  930. /* Program the ucode base for CP */
  931. kgsl_regwrite(device, GEN7_CP_SQE_INSTR_BASE_LO,
  932. lower_32_bits(fw->memdesc->gpuaddr));
  933. kgsl_regwrite(device, GEN7_CP_SQE_INSTR_BASE_HI,
  934. upper_32_bits(fw->memdesc->gpuaddr));
  935. /* Clear the SQE_HALT to start the CP engine */
  936. kgsl_regwrite(device, GEN7_CP_SQE_CNTL, 1);
  937. ret = gen7_send_cp_init(adreno_dev, rb);
  938. if (ret)
  939. return ret;
  940. ret = adreno_zap_shader_load(adreno_dev, gen7_core->zap_name);
  941. if (ret)
  942. return ret;
  943. /*
  944. * Take the GPU out of secure mode. Try the zap shader if it is loaded,
  945. * otherwise just try to write directly to the secure control register
  946. */
  947. if (!adreno_dev->zap_loaded)
  948. kgsl_regwrite(device, GEN7_RBBM_SECVID_TRUST_CNTL, 0);
  949. else {
  950. cmds = adreno_ringbuffer_allocspace(rb, 2);
  951. if (IS_ERR(cmds))
  952. return PTR_ERR(cmds);
  953. *cmds++ = cp_type7_packet(CP_SET_SECURE_MODE, 1);
  954. *cmds++ = 0;
  955. ret = gen7_ringbuffer_submit(rb, NULL);
  956. if (!ret) {
  957. ret = adreno_spin_idle(adreno_dev, 2000);
  958. if (ret) {
  959. gen7_spin_idle_debug(adreno_dev,
  960. "Switch to unsecure failed to idle\n");
  961. return ret;
  962. }
  963. }
  964. }
  965. return gen7_post_start(adreno_dev);
  966. }
  967. /*
  968. * gen7_gpu_keepalive() - GMU reg write to request GPU stays on
  969. * @adreno_dev: Pointer to the adreno device that has the GMU
  970. * @state: State to set: true is ON, false is OFF
  971. */
  972. static void gen7_gpu_keepalive(struct adreno_device *adreno_dev,
  973. bool state)
  974. {
  975. gmu_core_regwrite(KGSL_DEVICE(adreno_dev),
  976. GEN7_GMU_GMU_PWR_COL_KEEPALIVE, state);
  977. }
  978. bool gen7_hw_isidle(struct adreno_device *adreno_dev)
  979. {
  980. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  981. unsigned int reg;
  982. gmu_core_regread(device, GEN7_GPU_GMU_AO_GPU_CX_BUSY_STATUS, &reg);
  983. /* Bit 23 is GPUBUSYIGNAHB */
  984. return (reg & BIT(23)) ? false : true;
  985. }
  986. int gen7_microcode_read(struct adreno_device *adreno_dev)
  987. {
  988. struct adreno_firmware *sqe_fw = ADRENO_FW(adreno_dev, ADRENO_FW_SQE);
  989. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  990. return adreno_get_firmware(adreno_dev, gen7_core->sqefw_name, sqe_fw);
  991. }
  992. /* CP Interrupt bits */
  993. #define CP_INT_OPCODEERROR 0
  994. #define CP_INT_UCODEERROR 1
  995. #define CP_INT_CPHWFAULT 2
  996. #define CP_INT_REGISTERPROTECTION 4
  997. #define CP_INT_VSDPARITYERROR 6
  998. #define CP_INT_ILLEGALINSTRUCTION 7
  999. #define CP_INT_OPCODEERRORLPAC 8
  1000. #define CP_INT_UCODEERRORLPAC 9
  1001. #define CP_INT_CPHWFAULTLPAC 10
  1002. #define CP_INT_REGISTERPROTECTIONLPAC 11
  1003. #define CP_INT_ILLEGALINSTRUCTIONLPAC 12
  1004. #define CP_INT_OPCODEERRORBV 13
  1005. #define CP_INT_UCODEERRORBV 14
  1006. #define CP_INT_CPHWFAULTBV 15
  1007. #define CP_INT_REGISTERPROTECTIONBV 16
  1008. #define CP_INT_ILLEGALINSTRUCTIONBV 17
  1009. static void gen7_cp_hw_err_callback(struct adreno_device *adreno_dev, int bit)
  1010. {
  1011. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1012. unsigned int status1, status2;
  1013. struct device *dev = device->dev;
  1014. unsigned int opcode;
  1015. kgsl_regread(device, GEN7_CP_INTERRUPT_STATUS, &status1);
  1016. if (status1 & BIT(CP_INT_OPCODEERROR)) {
  1017. kgsl_regwrite(device, GEN7_CP_SQE_STAT_ADDR, 1);
  1018. kgsl_regread(device, GEN7_CP_SQE_STAT_DATA, &opcode);
  1019. dev_crit_ratelimited(dev,
  1020. "CP opcode error interrupt | opcode=0x%8.8x\n", opcode);
  1021. }
  1022. if (status1 & BIT(CP_INT_UCODEERROR))
  1023. dev_crit_ratelimited(dev, "CP ucode error interrupt\n");
  1024. if (status1 & BIT(CP_INT_CPHWFAULT)) {
  1025. kgsl_regread(device, GEN7_CP_HW_FAULT, &status2);
  1026. dev_crit_ratelimited(dev,
  1027. "CP | Ringbuffer HW fault | status=%x\n", status2);
  1028. }
  1029. if (status1 & BIT(CP_INT_REGISTERPROTECTION)) {
  1030. kgsl_regread(device, GEN7_CP_PROTECT_STATUS, &status2);
  1031. dev_crit_ratelimited(dev,
  1032. "CP | Protected mode error | %s | addr=%x | status=%x\n",
  1033. status2 & BIT(20) ? "READ" : "WRITE",
  1034. status2 & 0x3ffff, status2);
  1035. }
  1036. if (status1 & BIT(CP_INT_VSDPARITYERROR))
  1037. dev_crit_ratelimited(dev, "CP VSD decoder parity error\n");
  1038. if (status1 & BIT(CP_INT_ILLEGALINSTRUCTION))
  1039. dev_crit_ratelimited(dev, "CP Illegal instruction error\n");
  1040. if (status1 & BIT(CP_INT_OPCODEERRORLPAC))
  1041. dev_crit_ratelimited(dev, "CP Opcode error LPAC\n");
  1042. if (status1 & BIT(CP_INT_UCODEERRORLPAC))
  1043. dev_crit_ratelimited(dev, "CP ucode error LPAC\n");
  1044. if (status1 & BIT(CP_INT_CPHWFAULTLPAC))
  1045. dev_crit_ratelimited(dev, "CP hw fault LPAC\n");
  1046. if (status1 & BIT(CP_INT_REGISTERPROTECTIONLPAC))
  1047. dev_crit_ratelimited(dev, "CP register protection LPAC\n");
  1048. if (status1 & BIT(CP_INT_ILLEGALINSTRUCTIONLPAC))
  1049. dev_crit_ratelimited(dev, "CP illegal instruction LPAC\n");
  1050. if (status1 & BIT(CP_INT_OPCODEERRORBV)) {
  1051. kgsl_regwrite(device, GEN7_CP_BV_SQE_STAT_ADDR, 1);
  1052. kgsl_regread(device, GEN7_CP_BV_SQE_STAT_DATA, &opcode);
  1053. dev_crit_ratelimited(dev, "CP opcode error BV | opcode=0x%8.8x\n", opcode);
  1054. }
  1055. if (status1 & BIT(CP_INT_UCODEERRORBV))
  1056. dev_crit_ratelimited(dev, "CP ucode error BV\n");
  1057. if (status1 & BIT(CP_INT_CPHWFAULTBV)) {
  1058. kgsl_regread(device, GEN7_CP_BV_HW_FAULT, &status2);
  1059. dev_crit_ratelimited(dev,
  1060. "CP BV | Ringbuffer HW fault | status=%x\n", status2);
  1061. }
  1062. if (status1 & BIT(CP_INT_REGISTERPROTECTIONBV)) {
  1063. kgsl_regread(device, GEN7_CP_BV_PROTECT_STATUS, &status2);
  1064. dev_crit_ratelimited(dev,
  1065. "CP BV | Protected mode error | %s | addr=%x | status=%x\n",
  1066. status2 & BIT(20) ? "READ" : "WRITE",
  1067. status2 & 0x3ffff, status2);
  1068. }
  1069. if (status1 & BIT(CP_INT_ILLEGALINSTRUCTIONBV))
  1070. dev_crit_ratelimited(dev, "CP illegal instruction BV\n");
  1071. }
  1072. static void gen7_err_callback(struct adreno_device *adreno_dev, int bit)
  1073. {
  1074. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1075. struct device *dev = device->dev;
  1076. switch (bit) {
  1077. case GEN7_INT_AHBERROR:
  1078. {
  1079. u32 err_details_0, err_details_1;
  1080. kgsl_regread(device, GEN7_CP_RL_ERROR_DETAILS_0, &err_details_0);
  1081. kgsl_regread(device, GEN7_CP_RL_ERROR_DETAILS_1, &err_details_1);
  1082. dev_crit_ratelimited(dev,
  1083. "CP: AHB bus error, CP_RL_ERROR_DETAILS_0:0x%x CP_RL_ERROR_DETAILS_1:0x%x\n",
  1084. err_details_0, err_details_1);
  1085. break;
  1086. }
  1087. case GEN7_INT_ATBASYNCFIFOOVERFLOW:
  1088. dev_crit_ratelimited(dev, "RBBM: ATB ASYNC overflow\n");
  1089. break;
  1090. case GEN7_INT_ATBBUSOVERFLOW:
  1091. dev_crit_ratelimited(dev, "RBBM: ATB bus overflow\n");
  1092. break;
  1093. case GEN7_INT_OUTOFBOUNDACCESS:
  1094. dev_crit_ratelimited(dev, "UCHE: Out of bounds access\n");
  1095. break;
  1096. case GEN7_INT_UCHETRAPINTERRUPT:
  1097. dev_crit_ratelimited(dev, "UCHE: Trap interrupt\n");
  1098. break;
  1099. case GEN7_INT_TSBWRITEERROR:
  1100. {
  1101. u32 lo, hi;
  1102. kgsl_regread(device, GEN7_RBBM_SECVID_TSB_STATUS_LO, &lo);
  1103. kgsl_regread(device, GEN7_RBBM_SECVID_TSB_STATUS_HI, &hi);
  1104. dev_crit_ratelimited(dev, "TSB: Write error interrupt: Address: 0x%lx MID: %lu\n",
  1105. FIELD_GET(GENMASK(16, 0), hi) << 32 | lo,
  1106. FIELD_GET(GENMASK(31, 23), hi));
  1107. break;
  1108. }
  1109. default:
  1110. dev_crit_ratelimited(dev, "Unknown interrupt %d\n", bit);
  1111. }
  1112. }
  1113. static const char *const uche_client[] = {
  1114. "BR_VFD", "BR_SP", "BR_VSC", "BR_VPC",
  1115. "BR_HLSQ", "BR_PC", "BR_LRZ", "BR_TP",
  1116. "BV_VFD", "BV_SP", "BV_VSC", "BV_VPC",
  1117. "BV_HLSQ", "BV_PC", "BV_LRZ", "BV_TP"
  1118. };
  1119. static const char *const uche_lpac_client[] = {
  1120. "-", "SP_LPAC", "-", "-", "HLSQ_LPAC", "-", "-", "TP_LPAC"
  1121. };
  1122. #define SCOOBYDOO 0x5c00bd00
  1123. static const char *gen7_fault_block_uche(struct kgsl_device *device,
  1124. char *str, int size, bool lpac)
  1125. {
  1126. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  1127. unsigned int uche_client_id = adreno_dev->uche_client_pf;
  1128. const char *uche_client_str, *fault_block;
  1129. /*
  1130. * Smmu driver takes a vote on CX gdsc before calling the kgsl
  1131. * pagefault handler. If there is contention for device mutex in this
  1132. * path and the dispatcher fault handler is holding this lock, trying
  1133. * to turn off CX gdsc will fail during the reset. So to avoid blocking
  1134. * here, try to lock device mutex and return if it fails.
  1135. */
  1136. if (!mutex_trylock(&device->mutex))
  1137. goto regread_fail;
  1138. if (!kgsl_state_is_awake(device)) {
  1139. mutex_unlock(&device->mutex);
  1140. goto regread_fail;
  1141. }
  1142. kgsl_regread(device, GEN7_UCHE_CLIENT_PF, &uche_client_id);
  1143. mutex_unlock(&device->mutex);
  1144. /* Ignore the value if the gpu is in IFPC */
  1145. if (uche_client_id == SCOOBYDOO) {
  1146. uche_client_id = adreno_dev->uche_client_pf;
  1147. goto regread_fail;
  1148. }
  1149. /* UCHE client id mask is bits [6:0] */
  1150. uche_client_id &= GENMASK(6, 0);
  1151. regread_fail:
  1152. if (lpac) {
  1153. fault_block = "UCHE_LPAC";
  1154. if (uche_client_id >= ARRAY_SIZE(uche_lpac_client))
  1155. goto fail;
  1156. uche_client_str = uche_lpac_client[uche_client_id];
  1157. } else {
  1158. fault_block = "UCHE";
  1159. if (uche_client_id >= ARRAY_SIZE(uche_client))
  1160. goto fail;
  1161. uche_client_str = uche_client[uche_client_id];
  1162. }
  1163. snprintf(str, size, "%s: %s", fault_block, uche_client_str);
  1164. return str;
  1165. fail:
  1166. snprintf(str, size, "%s: Unknown (client_id: %u)",
  1167. fault_block, uche_client_id);
  1168. return str;
  1169. }
  1170. static const char *gen7_iommu_fault_block(struct kgsl_device *device,
  1171. unsigned int fsynr1)
  1172. {
  1173. unsigned int mid = fsynr1 & 0xff;
  1174. static char str[36];
  1175. switch (mid) {
  1176. case 0x0:
  1177. return "CP";
  1178. case 0x1:
  1179. return "UCHE: Unknown";
  1180. case 0x2:
  1181. return "UCHE_LPAC: Unknown";
  1182. case 0x3:
  1183. return gen7_fault_block_uche(device, str, sizeof(str), false);
  1184. case 0x4:
  1185. return "CCU";
  1186. case 0x5:
  1187. return "Flag cache";
  1188. case 0x6:
  1189. return "PREFETCH";
  1190. case 0x7:
  1191. return "GMU";
  1192. case 0x8:
  1193. return gen7_fault_block_uche(device, str, sizeof(str), true);
  1194. }
  1195. snprintf(str, sizeof(str), "Unknown (mid: %u)", mid);
  1196. return str;
  1197. }
  1198. static void gen7_cp_callback(struct adreno_device *adreno_dev, int bit)
  1199. {
  1200. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1201. if (adreno_is_preemption_enabled(adreno_dev))
  1202. gen7_preemption_trigger(adreno_dev, true);
  1203. adreno_dispatcher_schedule(device);
  1204. }
  1205. /*
  1206. * gen7_gpc_err_int_callback() - Isr for GPC error interrupts
  1207. * @adreno_dev: Pointer to device
  1208. * @bit: Interrupt bit
  1209. */
  1210. static void gen7_gpc_err_int_callback(struct adreno_device *adreno_dev, int bit)
  1211. {
  1212. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1213. /*
  1214. * GPC error is typically the result of mistake SW programming.
  1215. * Force GPU fault for this interrupt so that we can debug it
  1216. * with help of register dump.
  1217. */
  1218. dev_crit(device->dev, "RBBM: GPC error\n");
  1219. adreno_irqctrl(adreno_dev, 0);
  1220. /* Trigger a fault in the dispatcher - this will effect a restart */
  1221. adreno_dispatcher_fault(adreno_dev, ADRENO_SOFT_FAULT);
  1222. }
  1223. /*
  1224. * gen7_swfuse_violation_callback() - ISR for software fuse violation interrupt
  1225. * @adreno_dev: Pointer to device
  1226. * @bit: Interrupt bit
  1227. */
  1228. static void gen7_swfuse_violation_callback(struct adreno_device *adreno_dev, int bit)
  1229. {
  1230. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1231. u32 status;
  1232. /*
  1233. * SWFUSEVIOLATION error is typically the result of enabling software
  1234. * feature which is not supported by the hardware. Following are the
  1235. * Feature violation will be reported
  1236. * 1) FASTBLEND (BIT:0): NO Fault, RB will send the workload to legacy
  1237. * blender HW pipeline.
  1238. * 2) LPAC (BIT:1): Fault
  1239. * 3) RAYTRACING (BIT:2): Fault
  1240. */
  1241. kgsl_regread(device, GEN7_RBBM_SW_FUSE_INT_STATUS, &status);
  1242. /*
  1243. * RBBM_INT_CLEAR_CMD will not clear SWFUSEVIOLATION interrupt. Hence
  1244. * do explicit swfuse irq clear.
  1245. */
  1246. kgsl_regwrite(device, GEN7_RBBM_SW_FUSE_INT_MASK, 0);
  1247. dev_crit_ratelimited(device->dev,
  1248. "RBBM: SW Feature Fuse violation status=0x%8.8x\n", status);
  1249. /* Trigger a fault in the dispatcher for LPAC and RAYTRACING violation */
  1250. if (status & GENMASK(GEN7_RAYTRACING_SW_FUSE, GEN7_LPAC_SW_FUSE)) {
  1251. adreno_irqctrl(adreno_dev, 0);
  1252. adreno_dispatcher_fault(adreno_dev, ADRENO_HARD_FAULT);
  1253. }
  1254. }
  1255. static const struct adreno_irq_funcs gen7_irq_funcs[32] = {
  1256. ADRENO_IRQ_CALLBACK(NULL), /* 0 - RBBM_GPU_IDLE */
  1257. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 1 - RBBM_AHB_ERROR */
  1258. ADRENO_IRQ_CALLBACK(NULL), /* 2 - UNUSED */
  1259. ADRENO_IRQ_CALLBACK(NULL), /* 3 - UNUSED */
  1260. ADRENO_IRQ_CALLBACK(NULL), /* 4 - CPIPCINT0 */
  1261. ADRENO_IRQ_CALLBACK(NULL), /* 5 - CPIPCINT1 */
  1262. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 6 - ATBASYNCOVERFLOW */
  1263. ADRENO_IRQ_CALLBACK(gen7_gpc_err_int_callback), /* 7 - GPC_ERR */
  1264. ADRENO_IRQ_CALLBACK(gen7_preemption_callback),/* 8 - CP_SW */
  1265. ADRENO_IRQ_CALLBACK(gen7_cp_hw_err_callback), /* 9 - CP_HW_ERROR */
  1266. ADRENO_IRQ_CALLBACK(NULL), /* 10 - CP_CCU_FLUSH_DEPTH_TS */
  1267. ADRENO_IRQ_CALLBACK(NULL), /* 11 - CP_CCU_FLUSH_COLOR_TS */
  1268. ADRENO_IRQ_CALLBACK(NULL), /* 12 - CP_CCU_RESOLVE_TS */
  1269. ADRENO_IRQ_CALLBACK(NULL), /* 13 - UNUSED */
  1270. ADRENO_IRQ_CALLBACK(NULL), /* 14 - UNUSED */
  1271. ADRENO_IRQ_CALLBACK(adreno_cp_callback), /* 15 - CP_RB_INT */
  1272. ADRENO_IRQ_CALLBACK(NULL), /* 16 - CP_RB_INT_LPAC*/
  1273. ADRENO_IRQ_CALLBACK(NULL), /* 17 - CP_RB_DONE_TS */
  1274. ADRENO_IRQ_CALLBACK(NULL), /* 18 - UNUSED */
  1275. ADRENO_IRQ_CALLBACK(NULL), /* 19 - UNUSED */
  1276. ADRENO_IRQ_CALLBACK(gen7_cp_callback), /* 20 - CP_CACHE_FLUSH_TS */
  1277. ADRENO_IRQ_CALLBACK(NULL), /* 21 - CP_CACHE_TS_LPAC */
  1278. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 22 - RBBM_ATB_BUS_OVERFLOW */
  1279. ADRENO_IRQ_CALLBACK(adreno_hang_int_callback), /* 23 - MISHANGDETECT */
  1280. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 24 - UCHE_OOB_ACCESS */
  1281. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 25 - UCHE_TRAP_INTR */
  1282. ADRENO_IRQ_CALLBACK(NULL), /* 26 - DEBBUS_INTR_0 */
  1283. ADRENO_IRQ_CALLBACK(NULL), /* 27 - DEBBUS_INTR_1 */
  1284. ADRENO_IRQ_CALLBACK(gen7_err_callback), /* 28 - TSBWRITEERROR */
  1285. ADRENO_IRQ_CALLBACK(gen7_swfuse_violation_callback), /* 29 - SWFUSEVIOLATION */
  1286. ADRENO_IRQ_CALLBACK(NULL), /* 30 - ISDB_CPU_IRQ */
  1287. ADRENO_IRQ_CALLBACK(NULL), /* 31 - ISDB_UNDER_DEBUG */
  1288. };
  1289. /*
  1290. * If the AHB fence is not in ALLOW mode when we receive an RBBM
  1291. * interrupt, something went wrong. This means that we cannot proceed
  1292. * since the IRQ status and clear registers are not accessible.
  1293. * This is usually harmless because the GMU will abort power collapse
  1294. * and change the fence back to ALLOW. Poll so that this can happen.
  1295. */
  1296. static int gen7_irq_poll_fence(struct adreno_device *adreno_dev)
  1297. {
  1298. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1299. const struct adreno_gpudev *gpudev = ADRENO_GPU_DEVICE(adreno_dev);
  1300. u32 status, fence, fence_retries = 0;
  1301. u64 a, b, c;
  1302. a = gpudev->read_alwayson(adreno_dev);
  1303. kgsl_regread(device, GEN7_GMU_AO_AHB_FENCE_CTRL, &fence);
  1304. while (fence != 0) {
  1305. b = gpudev->read_alwayson(adreno_dev);
  1306. /* Wait for small time before trying again */
  1307. udelay(1);
  1308. kgsl_regread(device, GEN7_GMU_AO_AHB_FENCE_CTRL, &fence);
  1309. if (fence_retries == 100 && fence != 0) {
  1310. c = gpudev->read_alwayson(adreno_dev);
  1311. kgsl_regread(device, GEN7_GMU_RBBM_INT_UNMASKED_STATUS,
  1312. &status);
  1313. dev_crit_ratelimited(device->dev,
  1314. "status=0x%x Unmasked status=0x%x Mask=0x%x timestamps: %llx %llx %llx\n",
  1315. status & adreno_dev->irq_mask, status,
  1316. adreno_dev->irq_mask, a, b, c);
  1317. return -ETIMEDOUT;
  1318. }
  1319. fence_retries++;
  1320. }
  1321. return 0;
  1322. }
  1323. static irqreturn_t gen7_irq_handler(struct adreno_device *adreno_dev)
  1324. {
  1325. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1326. irqreturn_t ret = IRQ_NONE;
  1327. u32 status;
  1328. /*
  1329. * GPU can power down once the INT_0_STATUS is read below.
  1330. * But there still might be some register reads required so
  1331. * force the GMU/GPU into KEEPALIVE mode until done with the ISR.
  1332. */
  1333. gen7_gpu_keepalive(adreno_dev, true);
  1334. if (gen7_irq_poll_fence(adreno_dev)) {
  1335. adreno_dispatcher_fault(adreno_dev, ADRENO_GMU_FAULT);
  1336. goto done;
  1337. }
  1338. kgsl_regread(device, GEN7_RBBM_INT_0_STATUS, &status);
  1339. kgsl_regwrite(device, GEN7_RBBM_INT_CLEAR_CMD, status);
  1340. ret = adreno_irq_callbacks(adreno_dev, gen7_irq_funcs, status);
  1341. trace_kgsl_gen7_irq_status(adreno_dev, status);
  1342. done:
  1343. /* If hard fault, then let snapshot turn off the keepalive */
  1344. if (!(adreno_gpu_fault(adreno_dev) & ADRENO_HARD_FAULT))
  1345. gen7_gpu_keepalive(adreno_dev, false);
  1346. return ret;
  1347. }
  1348. int gen7_probe_common(struct platform_device *pdev,
  1349. struct adreno_device *adreno_dev, u32 chipid,
  1350. const struct adreno_gpu_core *gpucore)
  1351. {
  1352. const struct adreno_gpudev *gpudev = gpucore->gpudev;
  1353. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1354. const struct adreno_gen7_core *gen7_core = container_of(gpucore,
  1355. struct adreno_gen7_core, base);
  1356. int ret;
  1357. adreno_dev->gpucore = gpucore;
  1358. adreno_dev->chipid = chipid;
  1359. adreno_dev->cx_misc_base = GEN7_CX_MISC_BASE;
  1360. adreno_reg_offset_init(gpudev->reg_offsets);
  1361. adreno_dev->hwcg_enabled = true;
  1362. adreno_dev->uche_client_pf = 1;
  1363. kgsl_pwrscale_fast_bus_hint(gen7_core->fast_bus_hint);
  1364. device->pwrctrl.rt_bus_hint = gen7_core->rt_bus_hint;
  1365. device->pwrctrl.cx_cfg_gdsc_offset = adreno_is_gen7_11_0(adreno_dev) ?
  1366. GEN7_11_0_GPU_CC_CX_CFG_GDSCR : GEN7_GPU_CC_CX_CFG_GDSCR;
  1367. ret = adreno_device_probe(pdev, adreno_dev);
  1368. if (ret)
  1369. return ret;
  1370. if (adreno_preemption_feature_set(adreno_dev)) {
  1371. const struct adreno_gen7_core *gen7_core = to_gen7_core(adreno_dev);
  1372. adreno_dev->preempt.preempt_level = gen7_core->preempt_level;
  1373. adreno_dev->preempt.skipsaverestore = true;
  1374. adreno_dev->preempt.usesgmem = true;
  1375. set_bit(ADRENO_DEVICE_PREEMPTION, &adreno_dev->priv);
  1376. }
  1377. /* debugfs node for ACD calibration */
  1378. debugfs_create_file("acd_calibrate", 0644, device->d_debugfs, device, &acd_cal_fops);
  1379. gen7_coresight_init(adreno_dev);
  1380. /* Dump additional AQE 16KB data on top of default 96KB(48(BR)+48(BV)) */
  1381. device->snapshot_ctxt_record_size = ADRENO_FEATURE(adreno_dev, ADRENO_AQE) ?
  1382. 112 * SZ_1K : 96 * SZ_1K;
  1383. return 0;
  1384. }
  1385. /* Register offset defines for Gen7, in order of enum adreno_regs */
  1386. static unsigned int gen7_register_offsets[ADRENO_REG_REGISTER_MAX] = {
  1387. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_BASE, GEN7_CP_RB_BASE),
  1388. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_BASE_HI, GEN7_CP_RB_BASE_HI),
  1389. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_RPTR, GEN7_CP_RB_RPTR),
  1390. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_WPTR, GEN7_CP_RB_WPTR),
  1391. ADRENO_REG_DEFINE(ADRENO_REG_CP_ME_CNTL, GEN7_CP_SQE_CNTL),
  1392. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BASE, GEN7_CP_IB1_BASE),
  1393. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BASE_HI, GEN7_CP_IB1_BASE_HI),
  1394. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BUFSZ, GEN7_CP_IB1_REM_SIZE),
  1395. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BASE, GEN7_CP_IB2_BASE),
  1396. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BASE_HI, GEN7_CP_IB2_BASE_HI),
  1397. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BUFSZ, GEN7_CP_IB2_REM_SIZE),
  1398. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_STATUS, GEN7_RBBM_STATUS),
  1399. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_STATUS3, GEN7_RBBM_STATUS3),
  1400. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_INT_0_MASK, GEN7_RBBM_INT_0_MASK),
  1401. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_SW_RESET_CMD, GEN7_RBBM_SW_RESET_CMD),
  1402. ADRENO_REG_DEFINE(ADRENO_REG_GMU_AO_HOST_INTERRUPT_MASK,
  1403. GEN7_GMU_AO_HOST_INTERRUPT_MASK),
  1404. ADRENO_REG_DEFINE(ADRENO_REG_GMU_GMU2HOST_INTR_MASK,
  1405. GEN7_GMU_GMU2HOST_INTR_MASK),
  1406. };
  1407. static u32 _get_pipeid(u32 groupid)
  1408. {
  1409. if (groupid == KGSL_PERFCOUNTER_GROUP_BV_TSE || groupid == KGSL_PERFCOUNTER_GROUP_BV_RAS
  1410. || groupid == KGSL_PERFCOUNTER_GROUP_BV_LRZ
  1411. || groupid == KGSL_PERFCOUNTER_GROUP_BV_HLSQ)
  1412. return PIPE_BV;
  1413. else if (groupid == KGSL_PERFCOUNTER_GROUP_HLSQ || groupid == KGSL_PERFCOUNTER_GROUP_TSE
  1414. || groupid == KGSL_PERFCOUNTER_GROUP_RAS
  1415. || groupid == KGSL_PERFCOUNTER_GROUP_LRZ)
  1416. return PIPE_BR;
  1417. else
  1418. return PIPE_NONE;
  1419. }
  1420. int gen7_perfcounter_remove(struct adreno_device *adreno_dev,
  1421. struct adreno_perfcount_register *reg, u32 groupid)
  1422. {
  1423. const struct adreno_perfcounters *counters = ADRENO_PERFCOUNTERS(adreno_dev);
  1424. const struct adreno_perfcount_group *group;
  1425. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  1426. struct cpu_gpu_lock *lock = ptr;
  1427. u32 *data = ptr + sizeof(*lock);
  1428. int offset = (lock->ifpc_list_len + lock->preemption_list_len) * 2;
  1429. int i, second_last_offset, last_offset;
  1430. bool remove_counter = false;
  1431. u32 pipe = FIELD_PREP(GENMASK(13, 12), _get_pipeid(groupid));
  1432. if (!lock->dynamic_list_len)
  1433. return -EINVAL;
  1434. group = &(counters->groups[groupid]);
  1435. if (!(group->flags & ADRENO_PERFCOUNTER_GROUP_RESTORE)) {
  1436. if (lock->dynamic_list_len != 1)
  1437. return 0;
  1438. if (kgsl_hwlock(lock)) {
  1439. kgsl_hwunlock(lock);
  1440. return -EBUSY;
  1441. }
  1442. goto disable_perfcounter;
  1443. }
  1444. second_last_offset = offset + (lock->dynamic_list_len - 2) * 3;
  1445. last_offset = second_last_offset + 3;
  1446. /* Look for the perfcounter to remove in the list */
  1447. for (i = 0; i < lock->dynamic_list_len - 1; i++) {
  1448. if ((data[offset + 1] == reg->select) && (data[offset] == pipe)) {
  1449. remove_counter = true;
  1450. break;
  1451. }
  1452. offset += 3;
  1453. }
  1454. if (!remove_counter)
  1455. return -ENOENT;
  1456. if (kgsl_hwlock(lock)) {
  1457. kgsl_hwunlock(lock);
  1458. return -EBUSY;
  1459. }
  1460. /*
  1461. * If the entry is found, remove it from the list by overwriting with second last
  1462. * entry. Skip this if data at offset is already second last entry
  1463. */
  1464. if (offset != second_last_offset)
  1465. memcpy(&data[offset], &data[second_last_offset], 3 * sizeof(u32));
  1466. /*
  1467. * Overwrite the second last entry with last entry as last entry always has to be
  1468. * GEN7_RBBM_PERFCTR_CNTL.
  1469. */
  1470. memcpy(&data[second_last_offset], &data[last_offset], 3 * sizeof(u32));
  1471. /* Clear the last entry */
  1472. memset(&data[last_offset], 0, 3 * sizeof(u32));
  1473. lock->dynamic_list_len--;
  1474. disable_perfcounter:
  1475. /*
  1476. * If dynamic list length is 1 and no_restore_count is 0, then we can remove the
  1477. * only entry in the list, which is the GEN7_RBBM_PERFCTRL_CNTL.
  1478. */
  1479. if (lock->dynamic_list_len == 1 && !adreno_dev->no_restore_count) {
  1480. memset(&data[offset], 0, 3 * sizeof(u32));
  1481. lock->dynamic_list_len = 0;
  1482. }
  1483. kgsl_hwunlock(lock);
  1484. return 0;
  1485. }
  1486. int gen7_perfcounter_update(struct adreno_device *adreno_dev,
  1487. struct adreno_perfcount_register *reg, bool update_reg, u32 pipe, unsigned long flags)
  1488. {
  1489. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  1490. struct cpu_gpu_lock *lock = ptr;
  1491. u32 *data = ptr + sizeof(*lock);
  1492. int i, offset = (lock->ifpc_list_len + lock->preemption_list_len) * 2;
  1493. bool select_reg_present = false;
  1494. if (flags & ADRENO_PERFCOUNTER_GROUP_RESTORE) {
  1495. for (i = 0; i < lock->dynamic_list_len; i++) {
  1496. if ((data[offset + 1] == reg->select) && (data[offset] == pipe)) {
  1497. select_reg_present = true;
  1498. break;
  1499. }
  1500. if (data[offset + 1] == GEN7_RBBM_PERFCTR_CNTL)
  1501. break;
  1502. offset += 3;
  1503. }
  1504. } else if (lock->dynamic_list_len) {
  1505. goto update;
  1506. }
  1507. if (kgsl_hwlock(lock)) {
  1508. kgsl_hwunlock(lock);
  1509. return -EBUSY;
  1510. }
  1511. /*
  1512. * If the perfcounter select register is already present in reglist
  1513. * update it, otherwise append the <aperture, select register, value>
  1514. * triplet to the end of the list.
  1515. */
  1516. if (select_reg_present) {
  1517. data[offset + 2] = reg->countable;
  1518. kgsl_hwunlock(lock);
  1519. goto update;
  1520. }
  1521. /* Initialize the lock->dynamic_list_len to account for GEN7_RBBM_PERFCTR_CNTL */
  1522. if (!lock->dynamic_list_len)
  1523. lock->dynamic_list_len = 1;
  1524. /*
  1525. * For all targets GEN7_RBBM_PERFCTR_CNTL needs to be the last entry,
  1526. * so overwrite the existing GEN7_RBBM_PERFCTR_CNTL and add it back to
  1527. * the end.
  1528. */
  1529. if (flags & ADRENO_PERFCOUNTER_GROUP_RESTORE) {
  1530. data[offset++] = pipe;
  1531. data[offset++] = reg->select;
  1532. data[offset++] = reg->countable;
  1533. lock->dynamic_list_len++;
  1534. }
  1535. data[offset++] = FIELD_PREP(GENMASK(13, 12), PIPE_NONE);
  1536. data[offset++] = GEN7_RBBM_PERFCTR_CNTL;
  1537. data[offset++] = 1;
  1538. kgsl_hwunlock(lock);
  1539. update:
  1540. if (update_reg)
  1541. kgsl_regwrite(KGSL_DEVICE(adreno_dev), reg->select,
  1542. reg->countable);
  1543. return 0;
  1544. }
  1545. static u64 gen7_9_0_read_alwayson(struct adreno_device *adreno_dev)
  1546. {
  1547. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1548. u32 lo = 0, hi = 0, tmp = 0;
  1549. /* Always use the GMU AO counter when doing a AHB read */
  1550. gmu_core_regread(device, GEN7_GMU_CX_AO_COUNTER_HI, &hi);
  1551. gmu_core_regread(device, GEN7_GMU_CX_AO_COUNTER_LO, &lo);
  1552. /* Check for overflow */
  1553. gmu_core_regread(device, GEN7_GMU_CX_AO_COUNTER_HI, &tmp);
  1554. if (hi != tmp) {
  1555. gmu_core_regread(device, GEN7_GMU_CX_AO_COUNTER_LO,
  1556. &lo);
  1557. hi = tmp;
  1558. }
  1559. return (((u64) hi) << 32) | lo;
  1560. }
  1561. static u64 gen7_read_alwayson(struct adreno_device *adreno_dev)
  1562. {
  1563. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1564. u32 lo = 0, hi = 0, tmp = 0;
  1565. /* Always use the GMU AO counter when doing a AHB read */
  1566. gmu_core_regread(device, GEN7_GMU_ALWAYS_ON_COUNTER_H, &hi);
  1567. gmu_core_regread(device, GEN7_GMU_ALWAYS_ON_COUNTER_L, &lo);
  1568. /* Check for overflow */
  1569. gmu_core_regread(device, GEN7_GMU_ALWAYS_ON_COUNTER_H, &tmp);
  1570. if (hi != tmp) {
  1571. gmu_core_regread(device, GEN7_GMU_ALWAYS_ON_COUNTER_L,
  1572. &lo);
  1573. hi = tmp;
  1574. }
  1575. return (((u64) hi) << 32) | lo;
  1576. }
  1577. static int gen7_9_0_lpac_store(struct adreno_device *adreno_dev, bool enable)
  1578. {
  1579. if (!ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  1580. return -EINVAL;
  1581. if (!(adreno_dev->feature_fuse & BIT(GEN7_LPAC_SW_FUSE)) ||
  1582. (adreno_dev->lpac_enabled == enable))
  1583. return 0;
  1584. /* Power down the GPU before changing the lpac setting */
  1585. return adreno_power_cycle_bool(adreno_dev, &adreno_dev->lpac_enabled,
  1586. enable);
  1587. }
  1588. static int gen7_lpac_store(struct adreno_device *adreno_dev, bool enable)
  1589. {
  1590. if (!ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  1591. return -EINVAL;
  1592. if (adreno_dev->lpac_enabled == enable)
  1593. return 0;
  1594. /* Power down the GPU before changing the lpac setting */
  1595. return adreno_power_cycle_bool(adreno_dev, &adreno_dev->lpac_enabled,
  1596. enable);
  1597. }
  1598. static void gen7_remove(struct adreno_device *adreno_dev)
  1599. {
  1600. struct gen7_gmu_device *gmu = to_gen7_gmu(adreno_dev);
  1601. /* Make sure timer is initialized, otherwise WARN_ON is generated */
  1602. if (adreno_preemption_feature_set(adreno_dev) &&
  1603. (test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags)))
  1604. del_timer(&adreno_dev->preempt.timer);
  1605. }
  1606. static void gen7_read_bus_stats(struct kgsl_device *device,
  1607. struct kgsl_power_stats *stats,
  1608. struct adreno_busy_data *busy)
  1609. {
  1610. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  1611. u64 ram_cycles, starved_ram;
  1612. ram_cycles = counter_delta(device, adreno_dev->ram_cycles_lo,
  1613. &busy->bif_ram_cycles);
  1614. starved_ram = counter_delta(device, adreno_dev->starved_ram_lo,
  1615. &busy->bif_starved_ram);
  1616. ram_cycles += counter_delta(device,
  1617. adreno_dev->ram_cycles_lo_ch1_read,
  1618. &busy->bif_ram_cycles_read_ch1);
  1619. ram_cycles += counter_delta(device,
  1620. adreno_dev->ram_cycles_lo_ch0_write,
  1621. &busy->bif_ram_cycles_write_ch0);
  1622. ram_cycles += counter_delta(device,
  1623. adreno_dev->ram_cycles_lo_ch1_write,
  1624. &busy->bif_ram_cycles_write_ch1);
  1625. starved_ram += counter_delta(device,
  1626. adreno_dev->starved_ram_lo_ch1,
  1627. &busy->bif_starved_ram_ch1);
  1628. stats->ram_time = ram_cycles;
  1629. stats->ram_wait = starved_ram;
  1630. }
  1631. static void gen7_power_stats(struct adreno_device *adreno_dev,
  1632. struct kgsl_power_stats *stats)
  1633. {
  1634. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1635. struct adreno_busy_data *busy = &adreno_dev->busy_data;
  1636. u64 gpu_busy;
  1637. /* Set the GPU busy counter for frequency scaling */
  1638. gpu_busy = counter_delta(device, GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_0_L,
  1639. &busy->gpu_busy);
  1640. stats->busy_time = gpu_busy * 10;
  1641. do_div(stats->busy_time, 192);
  1642. if (ADRENO_FEATURE(adreno_dev, ADRENO_IFPC)) {
  1643. u32 ifpc = counter_delta(device,
  1644. GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_4_L,
  1645. &busy->num_ifpc);
  1646. adreno_dev->ifpc_count += ifpc;
  1647. if (ifpc > 0)
  1648. trace_adreno_ifpc_count(adreno_dev->ifpc_count);
  1649. }
  1650. if (device->pwrctrl.bus_control)
  1651. gen7_read_bus_stats(device, stats, busy);
  1652. if (adreno_dev->bcl_enabled) {
  1653. u32 a, b, c;
  1654. a = counter_delta(device, GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_1_L,
  1655. &busy->throttle_cycles[0]);
  1656. b = counter_delta(device, GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_2_L,
  1657. &busy->throttle_cycles[1]);
  1658. c = counter_delta(device, GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_3_L,
  1659. &busy->throttle_cycles[2]);
  1660. if (a || b || c)
  1661. trace_kgsl_bcl_clock_throttling(a, b, c);
  1662. if (adreno_is_gen7_2_x_family(adreno_dev)) {
  1663. u32 bcl_throttle = counter_delta(device,
  1664. GEN7_GMU_CX_GMU_POWER_COUNTER_XOCLK_5_L, &busy->bcl_throttle);
  1665. /*
  1666. * This counts number of cycles throttled in XO cycles. Convert it to
  1667. * micro seconds by dividing by XO freq which is 19.2MHz.
  1668. */
  1669. adreno_dev->bcl_throttle_time_us += ((bcl_throttle * 10) / 192);
  1670. }
  1671. }
  1672. }
  1673. static int gen7_setproperty(struct kgsl_device_private *dev_priv,
  1674. u32 type, void __user *value, u32 sizebytes)
  1675. {
  1676. struct kgsl_device *device = dev_priv->device;
  1677. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  1678. u32 enable;
  1679. if (type != KGSL_PROP_PWRCTRL)
  1680. return -ENODEV;
  1681. if (sizebytes != sizeof(enable))
  1682. return -EINVAL;
  1683. if (copy_from_user(&enable, value, sizeof(enable)))
  1684. return -EFAULT;
  1685. mutex_lock(&device->mutex);
  1686. if (enable) {
  1687. clear_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags);
  1688. kgsl_pwrscale_enable(device);
  1689. } else {
  1690. set_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags);
  1691. if (!adreno_active_count_get(adreno_dev))
  1692. adreno_active_count_put(adreno_dev);
  1693. kgsl_pwrscale_disable(device, true);
  1694. }
  1695. mutex_unlock(&device->mutex);
  1696. return 0;
  1697. }
  1698. static void gen7_set_isdb_breakpoint_registers(struct adreno_device *adreno_dev)
  1699. {
  1700. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1701. struct clk *clk;
  1702. int ret;
  1703. if (!device->set_isdb_breakpoint || device->ftbl->is_hwcg_on(device)
  1704. || device->qdss_gfx_virt == NULL || !device->force_panic)
  1705. return;
  1706. clk = clk_get(&device->pdev->dev, "apb_pclk");
  1707. if (IS_ERR(clk)) {
  1708. dev_err(device->dev, "Unable to get QDSS clock\n");
  1709. goto err;
  1710. }
  1711. ret = clk_prepare_enable(clk);
  1712. if (ret) {
  1713. dev_err(device->dev, "QDSS Clock enable error: %d\n", ret);
  1714. clk_put(clk);
  1715. goto err;
  1716. }
  1717. /* Issue break command for eight SPs */
  1718. isdb_write(device->qdss_gfx_virt, 0x0000);
  1719. isdb_write(device->qdss_gfx_virt, 0x1000);
  1720. isdb_write(device->qdss_gfx_virt, 0x2000);
  1721. isdb_write(device->qdss_gfx_virt, 0x3000);
  1722. isdb_write(device->qdss_gfx_virt, 0x4000);
  1723. isdb_write(device->qdss_gfx_virt, 0x5000);
  1724. isdb_write(device->qdss_gfx_virt, 0x6000);
  1725. isdb_write(device->qdss_gfx_virt, 0x7000);
  1726. /* gen7_2_x has additional SPs */
  1727. if (adreno_is_gen7_2_x_family(adreno_dev)) {
  1728. isdb_write(device->qdss_gfx_virt, 0x8000);
  1729. isdb_write(device->qdss_gfx_virt, 0x9000);
  1730. isdb_write(device->qdss_gfx_virt, 0xa000);
  1731. isdb_write(device->qdss_gfx_virt, 0xb000);
  1732. }
  1733. clk_disable_unprepare(clk);
  1734. clk_put(clk);
  1735. return;
  1736. err:
  1737. /* Do not force kernel panic if isdb writes did not go through */
  1738. device->force_panic = false;
  1739. }
  1740. static void gen7_swfuse_irqctrl(struct adreno_device *adreno_dev, bool state)
  1741. {
  1742. if (adreno_is_gen7_9_x(adreno_dev))
  1743. kgsl_regwrite(KGSL_DEVICE(adreno_dev), GEN7_RBBM_SW_FUSE_INT_MASK,
  1744. state ? GEN7_SW_FUSE_INT_MASK : 0);
  1745. }
  1746. static void gen7_lpac_fault_header(struct adreno_device *adreno_dev,
  1747. struct kgsl_drawobj *drawobj_lpac)
  1748. {
  1749. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1750. struct adreno_context *drawctxt_lpac;
  1751. u32 status = 0, lpac_rptr = 0, lpac_wptr = 0, lpac_ib1sz = 0, lpac_ib2sz = 0;
  1752. u64 lpac_ib1base = 0, lpac_ib2base = 0;
  1753. bool gx_on = adreno_gx_is_on(adreno_dev);
  1754. drawctxt_lpac = ADRENO_CONTEXT(drawobj_lpac->context);
  1755. drawobj_lpac->context->last_faulted_cmd_ts = drawobj_lpac->timestamp;
  1756. drawobj_lpac->context->total_fault_count++;
  1757. pr_context(device, drawobj_lpac->context,
  1758. "LPAC ctx %d ctx_type %s ts %d dispatch_queue=%d\n",
  1759. drawobj_lpac->context->id, kgsl_context_type(drawctxt_lpac->type),
  1760. drawobj_lpac->timestamp, drawobj_lpac->context->gmu_dispatch_queue);
  1761. pr_context(device, drawobj_lpac->context, "lpac cmdline: %s\n",
  1762. drawctxt_lpac->base.proc_priv->cmdline);
  1763. if (!gx_on)
  1764. goto done;
  1765. kgsl_regread(device, GEN7_RBBM_STATUS, &status);
  1766. kgsl_regread(device, GEN7_CP_LPAC_RB_RPTR, &lpac_rptr);
  1767. kgsl_regread(device, GEN7_CP_LPAC_RB_WPTR, &lpac_wptr);
  1768. kgsl_regread64(device, GEN7_CP_LPAC_IB1_BASE_HI,
  1769. GEN7_CP_LPAC_IB1_BASE, &lpac_ib1base);
  1770. kgsl_regread(device, GEN7_CP_LPAC_IB1_REM_SIZE, &lpac_ib1sz);
  1771. kgsl_regread64(device, GEN7_CP_LPAC_IB2_BASE_HI,
  1772. GEN7_CP_LPAC_IB2_BASE, &lpac_ib2base);
  1773. kgsl_regread(device, GEN7_CP_LPAC_IB2_REM_SIZE, &lpac_ib2sz);
  1774. pr_context(device, drawobj_lpac->context,
  1775. "LPAC: status %8.8X rb %4.4x/%4.4x ib1 %16.16llX/%4.4x ib2 %16.16llX/%4.4x\n",
  1776. status, lpac_rptr, lpac_wptr, lpac_ib1base,
  1777. lpac_ib1sz, lpac_ib2base, lpac_ib2sz);
  1778. done:
  1779. trace_adreno_gpu_fault(drawobj_lpac->context->id, drawobj_lpac->timestamp, status,
  1780. lpac_rptr, lpac_wptr, lpac_ib1base, lpac_ib1sz, lpac_ib2base, lpac_ib2sz,
  1781. adreno_get_level(drawobj_lpac->context));
  1782. }
  1783. const struct gen7_gpudev adreno_gen7_9_0_hwsched_gpudev = {
  1784. .base = {
  1785. .reg_offsets = gen7_register_offsets,
  1786. .probe = gen7_hwsched_probe,
  1787. .snapshot = gen7_hwsched_snapshot,
  1788. .irq_handler = gen7_irq_handler,
  1789. .iommu_fault_block = gen7_iommu_fault_block,
  1790. .preemption_context_init = gen7_preemption_context_init,
  1791. .context_detach = gen7_hwsched_context_detach,
  1792. .read_alwayson = gen7_9_0_read_alwayson,
  1793. .reset = gen7_hwsched_reset_replay,
  1794. .power_ops = &gen7_hwsched_power_ops,
  1795. .power_stats = gen7_power_stats,
  1796. .setproperty = gen7_setproperty,
  1797. .hw_isidle = gen7_hw_isidle,
  1798. .add_to_va_minidump = gen7_hwsched_add_to_minidump,
  1799. .gx_is_on = gen7_gmu_gx_is_on,
  1800. .send_recurring_cmdobj = gen7_hwsched_send_recurring_cmdobj,
  1801. .perfcounter_remove = gen7_perfcounter_remove,
  1802. .set_isdb_breakpoint_registers = gen7_set_isdb_breakpoint_registers,
  1803. .context_destroy = gen7_hwsched_context_destroy,
  1804. .lpac_store = gen7_9_0_lpac_store,
  1805. .get_uche_trap_base = gen7_get_uche_trap_base,
  1806. .lpac_fault_header = gen7_lpac_fault_header,
  1807. },
  1808. .hfi_probe = gen7_hwsched_hfi_probe,
  1809. .hfi_remove = gen7_hwsched_hfi_remove,
  1810. .handle_watchdog = gen7_hwsched_handle_watchdog,
  1811. };
  1812. const struct gen7_gpudev adreno_gen7_hwsched_gpudev = {
  1813. .base = {
  1814. .reg_offsets = gen7_register_offsets,
  1815. .probe = gen7_hwsched_probe,
  1816. .snapshot = gen7_hwsched_snapshot,
  1817. .irq_handler = gen7_irq_handler,
  1818. .iommu_fault_block = gen7_iommu_fault_block,
  1819. .preemption_context_init = gen7_preemption_context_init,
  1820. .context_detach = gen7_hwsched_context_detach,
  1821. .read_alwayson = gen7_read_alwayson,
  1822. .reset = gen7_hwsched_reset_replay,
  1823. .power_ops = &gen7_hwsched_power_ops,
  1824. .power_stats = gen7_power_stats,
  1825. .setproperty = gen7_setproperty,
  1826. .hw_isidle = gen7_hw_isidle,
  1827. .add_to_va_minidump = gen7_hwsched_add_to_minidump,
  1828. .gx_is_on = gen7_gmu_gx_is_on,
  1829. .send_recurring_cmdobj = gen7_hwsched_send_recurring_cmdobj,
  1830. .perfcounter_remove = gen7_perfcounter_remove,
  1831. .set_isdb_breakpoint_registers = gen7_set_isdb_breakpoint_registers,
  1832. .context_destroy = gen7_hwsched_context_destroy,
  1833. .lpac_store = gen7_lpac_store,
  1834. .get_uche_trap_base = gen7_get_uche_trap_base,
  1835. .lpac_fault_header = gen7_lpac_fault_header,
  1836. },
  1837. .hfi_probe = gen7_hwsched_hfi_probe,
  1838. .hfi_remove = gen7_hwsched_hfi_remove,
  1839. .handle_watchdog = gen7_hwsched_handle_watchdog,
  1840. };
  1841. const struct gen7_gpudev adreno_gen7_gmu_gpudev = {
  1842. .base = {
  1843. .reg_offsets = gen7_register_offsets,
  1844. .probe = gen7_gmu_device_probe,
  1845. .snapshot = gen7_gmu_snapshot,
  1846. .irq_handler = gen7_irq_handler,
  1847. .rb_start = gen7_rb_start,
  1848. .gpu_keepalive = gen7_gpu_keepalive,
  1849. .hw_isidle = gen7_hw_isidle,
  1850. .iommu_fault_block = gen7_iommu_fault_block,
  1851. .reset = gen7_gmu_reset,
  1852. .preemption_schedule = gen7_preemption_schedule,
  1853. .preemption_context_init = gen7_preemption_context_init,
  1854. .read_alwayson = gen7_read_alwayson,
  1855. .power_ops = &gen7_gmu_power_ops,
  1856. .remove = gen7_remove,
  1857. .ringbuffer_submitcmd = gen7_ringbuffer_submitcmd,
  1858. .power_stats = gen7_power_stats,
  1859. .setproperty = gen7_setproperty,
  1860. .add_to_va_minidump = gen7_gmu_add_to_minidump,
  1861. .gx_is_on = gen7_gmu_gx_is_on,
  1862. .perfcounter_remove = gen7_perfcounter_remove,
  1863. .set_isdb_breakpoint_registers = gen7_set_isdb_breakpoint_registers,
  1864. .swfuse_irqctrl = gen7_swfuse_irqctrl,
  1865. .get_uche_trap_base = gen7_get_uche_trap_base,
  1866. },
  1867. .hfi_probe = gen7_gmu_hfi_probe,
  1868. .handle_watchdog = gen7_gmu_handle_watchdog,
  1869. };