adreno_gen8.c 88 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (c) 2021, The Linux Foundation. All rights reserved.
  4. * Copyright (c) 2023-2024, Qualcomm Innovation Center, Inc. All rights reserved.
  5. */
  6. #include <linux/debugfs.h>
  7. #include <linux/io.h>
  8. #include <linux/of.h>
  9. #include <linux/of_fdt.h>
  10. #include <linux/of_device.h>
  11. #include <linux/regulator/consumer.h>
  12. #include <linux/soc/qcom/llcc-qcom.h>
  13. #include <soc/qcom/of_common.h>
  14. #include "adreno.h"
  15. #include "adreno_gen8.h"
  16. #include "adreno_gen8_hwsched.h"
  17. #include "adreno_pm4types.h"
  18. #include "adreno_trace.h"
  19. #include "kgsl_pwrscale.h"
  20. #include "kgsl_trace.h"
  21. #include "kgsl_util.h"
  22. /* IFPC & Preemption static powerup restore list */
  23. static const u32 gen8_3_0_pwrup_reglist[] = {
  24. GEN8_UCHE_MODE_CNTL,
  25. GEN8_UCHE_VARB_IDLE_TIMEOUT,
  26. GEN8_UCHE_GBIF_GX_CONFIG,
  27. GEN8_UCHE_CACHE_WAYS,
  28. GEN8_UCHE_CCHE_MODE_CNTL,
  29. GEN8_UCHE_CCHE_CACHE_WAYS,
  30. GEN8_UCHE_CCHE_GC_GMEM_RANGE_MIN_LO,
  31. GEN8_UCHE_CCHE_GC_GMEM_RANGE_MIN_HI,
  32. GEN8_UCHE_WRITE_THRU_BASE_LO,
  33. GEN8_UCHE_WRITE_THRU_BASE_HI,
  34. GEN8_UCHE_TRAP_BASE_LO,
  35. GEN8_UCHE_TRAP_BASE_HI,
  36. GEN8_UCHE_CLIENT_PF,
  37. GEN8_VSC_BIN_SIZE,
  38. GEN8_RB_CMP_NC_MODE_CNTL,
  39. GEN8_SP_HLSQ_TIMEOUT_THRESHOLD_DP,
  40. GEN8_SP_HLSQ_GC_GMEM_RANGE_MIN_LO,
  41. GEN8_SP_HLSQ_GC_GMEM_RANGE_MIN_HI,
  42. GEN8_SP_READ_SEL,
  43. };
  44. /* IFPC only static powerup restore list */
  45. static const u32 gen8_3_0_ifpc_pwrup_reglist[] = {
  46. GEN8_RBBM_NC_MODE_CNTL,
  47. GEN8_RBBM_SLICE_INTERFACE_HANG_INT_CNTL,
  48. GEN8_RBBM_SLICE_NC_MODE_CNTL,
  49. GEN8_SP_NC_MODE_CNTL,
  50. GEN8_SP_CHICKEN_BITS_2,
  51. GEN8_SP_CHICKEN_BITS_3,
  52. GEN8_SP_PERFCTR_SHADER_MASK,
  53. GEN8_TPL1_NC_MODE_CNTL,
  54. GEN8_TPL1_DBG_ECO_CNTL,
  55. GEN8_TPL1_DBG_ECO_CNTL1,
  56. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_1,
  57. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_2,
  58. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_3,
  59. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_4,
  60. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_5,
  61. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_6,
  62. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_7,
  63. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_8,
  64. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_9,
  65. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_10,
  66. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_11,
  67. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_12,
  68. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_13,
  69. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_14,
  70. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_15,
  71. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_16,
  72. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_17,
  73. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_18,
  74. GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_19,
  75. GEN8_CP_PROTECT_REG_GLOBAL,
  76. GEN8_CP_PROTECT_REG_GLOBAL + 1,
  77. GEN8_CP_PROTECT_REG_GLOBAL + 2,
  78. GEN8_CP_PROTECT_REG_GLOBAL + 3,
  79. GEN8_CP_PROTECT_REG_GLOBAL + 4,
  80. GEN8_CP_PROTECT_REG_GLOBAL + 5,
  81. GEN8_CP_PROTECT_REG_GLOBAL + 6,
  82. GEN8_CP_PROTECT_REG_GLOBAL + 7,
  83. GEN8_CP_PROTECT_REG_GLOBAL + 8,
  84. GEN8_CP_PROTECT_REG_GLOBAL + 9,
  85. GEN8_CP_PROTECT_REG_GLOBAL + 10,
  86. GEN8_CP_PROTECT_REG_GLOBAL + 11,
  87. GEN8_CP_PROTECT_REG_GLOBAL + 12,
  88. GEN8_CP_PROTECT_REG_GLOBAL + 13,
  89. GEN8_CP_PROTECT_REG_GLOBAL + 14,
  90. GEN8_CP_PROTECT_REG_GLOBAL + 15,
  91. GEN8_CP_PROTECT_REG_GLOBAL + 16,
  92. GEN8_CP_PROTECT_REG_GLOBAL + 17,
  93. GEN8_CP_PROTECT_REG_GLOBAL + 18,
  94. GEN8_CP_PROTECT_REG_GLOBAL + 19,
  95. GEN8_CP_PROTECT_REG_GLOBAL + 20,
  96. GEN8_CP_PROTECT_REG_GLOBAL + 21,
  97. GEN8_CP_PROTECT_REG_GLOBAL + 22,
  98. GEN8_CP_PROTECT_REG_GLOBAL + 23,
  99. GEN8_CP_PROTECT_REG_GLOBAL + 24,
  100. GEN8_CP_PROTECT_REG_GLOBAL + 25,
  101. GEN8_CP_PROTECT_REG_GLOBAL + 26,
  102. GEN8_CP_PROTECT_REG_GLOBAL + 27,
  103. GEN8_CP_PROTECT_REG_GLOBAL + 28,
  104. GEN8_CP_PROTECT_REG_GLOBAL + 29,
  105. GEN8_CP_PROTECT_REG_GLOBAL + 30,
  106. GEN8_CP_PROTECT_REG_GLOBAL + 31,
  107. GEN8_CP_PROTECT_REG_GLOBAL + 32,
  108. GEN8_CP_PROTECT_REG_GLOBAL + 33,
  109. GEN8_CP_PROTECT_REG_GLOBAL + 34,
  110. GEN8_CP_PROTECT_REG_GLOBAL + 35,
  111. GEN8_CP_PROTECT_REG_GLOBAL + 36,
  112. GEN8_CP_PROTECT_REG_GLOBAL + 37,
  113. GEN8_CP_PROTECT_REG_GLOBAL + 38,
  114. GEN8_CP_PROTECT_REG_GLOBAL + 39,
  115. GEN8_CP_PROTECT_REG_GLOBAL + 40,
  116. GEN8_CP_PROTECT_REG_GLOBAL + 41,
  117. GEN8_CP_PROTECT_REG_GLOBAL + 42,
  118. GEN8_CP_PROTECT_REG_GLOBAL + 43,
  119. GEN8_CP_PROTECT_REG_GLOBAL + 44,
  120. GEN8_CP_PROTECT_REG_GLOBAL + 45,
  121. GEN8_CP_PROTECT_REG_GLOBAL + 63,
  122. };
  123. static const struct gen8_pwrup_extlist gen8_3_0_pwrup_extlist[] = {
  124. { GEN8_CP_PROTECT_CNTL_PIPE, BIT(PIPE_BR) | BIT(PIPE_BV) },
  125. { GEN8_CP_PROTECT_REG_PIPE + 15, BIT(PIPE_BR) | BIT(PIPE_BV) },
  126. { GEN8_GRAS_TSEFE_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR)},
  127. { GEN8_GRAS_NC_MODE_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR)},
  128. { GEN8_GRAS_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR)},
  129. { GEN8_RB_CCU_CNTL, BIT(PIPE_BR)},
  130. { GEN8_RB_CCU_NC_MODE_CNTL, BIT(PIPE_BR)},
  131. { GEN8_RB_CMP_NC_MODE_CNTL, BIT(PIPE_BR)},
  132. { GEN8_RB_RESOLVE_PREFETCH_CNTL, BIT(PIPE_BR)},
  133. { GEN8_RB_CMP_DBG_ECO_CNTL, BIT(PIPE_BR)},
  134. { GEN8_RB_GC_GMEM_PROTECT, BIT(PIPE_BR)},
  135. { GEN8_RB_CONTEXT_SWITCH_GMEM_SAVE_RESTORE, BIT(PIPE_BR)},
  136. { GEN8_VPC_FLATSHADE_MODE_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR)},
  137. { GEN8_PC_CHICKEN_BITS_1, BIT(PIPE_BV) | BIT(PIPE_BR)},
  138. { GEN8_PC_CHICKEN_BITS_2, BIT(PIPE_BV) | BIT(PIPE_BR)},
  139. { GEN8_PC_CHICKEN_BITS_3, BIT(PIPE_BV) | BIT(PIPE_BR)},
  140. { GEN8_PC_CHICKEN_BITS_4, BIT(PIPE_BV) | BIT(PIPE_BR)},
  141. { GEN8_PC_AUTO_VERTEX_STRIDE, BIT(PIPE_BR) | BIT(PIPE_BV)},
  142. { GEN8_PC_VIS_STREAM_CNTL, BIT(PIPE_BR) | BIT(PIPE_BV)},
  143. { GEN8_PC_CONTEXT_SWITCH_STABILIZE_CNTL_1, BIT(PIPE_BR) | BIT(PIPE_BV)},
  144. { GEN8_VFD_CB_BV_THRESHOLD, BIT(PIPE_BV) | BIT(PIPE_BR)},
  145. { GEN8_VFD_CB_BR_THRESHOLD, BIT(PIPE_BV) | BIT(PIPE_BR)},
  146. { GEN8_VFD_CB_BUSY_REQ_CNT, BIT(PIPE_BV) | BIT(PIPE_BR)},
  147. { GEN8_VFD_CB_LP_REQ_CNT, BIT(PIPE_BV) | BIT(PIPE_BR)},
  148. { GEN8_VFD_DBG_ECO_CNTL, BIT(PIPE_BR) | BIT(PIPE_BV)},
  149. };
  150. struct gen8_nonctxt_overrides gen8_nc_overrides[] = {
  151. { GEN8_UCHE_MODE_CNTL, BIT(PIPE_NONE), 0, 0, 0, },
  152. { GEN8_UCHE_CACHE_WAYS, BIT(PIPE_NONE), 0, 0, 0, },
  153. { GEN8_UCHE_CLIENT_PF, BIT(PIPE_NONE), 0, 0, 0, },
  154. { GEN8_UCHE_DBG_ECO_CNTL_0, BIT(PIPE_NONE), 0, 0, 2, },
  155. { GEN8_UCHE_HW_DBG_CNTL, BIT(PIPE_NONE), 0, 0, 2, },
  156. { GEN8_UCHE_CCHE_HW_DBG_CNTL, BIT(PIPE_NONE), 0, 0, 2, },
  157. { GEN8_GRAS_NC_MODE_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  158. { GEN8_GRAS_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  159. { GEN8_RB_DBG_ECO_CNTL, BIT(PIPE_BR), 0, 0, 3, },
  160. { GEN8_RB_CCU_DBG_ECO_CNTL, BIT(PIPE_BR), 0, 0, 3, },
  161. { GEN8_RB_CCU_CNTL, BIT(PIPE_BR), 0, 0, 0, },
  162. { GEN8_RB_CCU_NC_MODE_CNTL, BIT(PIPE_BR), 0, 0, 0, },
  163. { GEN8_RB_SLICE_UFC_PREFETCH_CNTL, BIT(PIPE_BR), 0, 0, 3, },
  164. { GEN8_RB_SLICE_UFC_DBG_CNTL, BIT(PIPE_BR), 0, 0, 3, },
  165. { GEN8_RB_CMP_NC_MODE_CNTL, BIT(PIPE_BR), 0, 0, 0, },
  166. { GEN8_RB_RESOLVE_PREFETCH_CNTL, BIT(PIPE_BR), 0, 0, 0, },
  167. { GEN8_RB_CMP_DBG_ECO_CNTL, BIT(PIPE_BR), 0, 0, 0, },
  168. { GEN8_RB_UFC_DBG_CNTL, BIT(PIPE_BR), 0, 0, 3, },
  169. { GEN8_PC_CHICKEN_BITS_1, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  170. { GEN8_PC_CHICKEN_BITS_2, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  171. { GEN8_PC_CHICKEN_BITS_3, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  172. { GEN8_PC_CHICKEN_BITS_4, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  173. { GEN8_PC_CHICKEN_BITS_5, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 2, },
  174. { GEN8_PC_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 3, },
  175. { GEN8_VFD_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  176. { GEN8_VFD_CB_BV_THRESHOLD, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  177. { GEN8_VFD_CB_BR_THRESHOLD, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  178. { GEN8_VFD_CB_LP_REQ_CNT, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  179. { GEN8_VFD_CB_BUSY_REQ_CNT, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  180. { GEN8_VPC_DBG_ECO_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 2, },
  181. { GEN8_VPC_DBG_ECO_CNTL_1, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 2, },
  182. { GEN8_VPC_DBG_ECO_CNTL_2, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 1, },
  183. { GEN8_VPC_DBG_ECO_CNTL_3, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 2, },
  184. { GEN8_VPC_FLATSHADE_MODE_CNTL, BIT(PIPE_BV) | BIT(PIPE_BR), 0, 0, 0, },
  185. { GEN8_SP_DBG_ECO_CNTL, BIT(PIPE_NONE), 0, 0, 1, },
  186. { GEN8_SP_NC_MODE_CNTL, BIT(PIPE_NONE), 0, 0, 0, },
  187. { GEN8_SP_CHICKEN_BITS, BIT(PIPE_NONE), 0, 0, 1, },
  188. { GEN8_SP_NC_MODE_CNTL_2, BIT(PIPE_NONE), 0, 0, 1, },
  189. { GEN8_SP_CHICKEN_BITS_1, BIT(PIPE_NONE), 0, 0, 0, },
  190. { GEN8_SP_CHICKEN_BITS_2, BIT(PIPE_NONE), 0, 0, 0, },
  191. { GEN8_SP_CHICKEN_BITS_3, BIT(PIPE_NONE), 0, 0, 0, },
  192. { GEN8_SP_CHICKEN_BITS_4, BIT(PIPE_NONE), 0, 0, 1, },
  193. { GEN8_SP_DISPATCH_CNTL, BIT(PIPE_NONE), 0, 0, 1, },
  194. { GEN8_SP_HLSQ_DBG_ECO_CNTL, BIT(PIPE_NONE), 0, 0, 1, },
  195. { GEN8_SP_DBG_CNTL, BIT(PIPE_NONE), 0, 0, 1, },
  196. { GEN8_TPL1_NC_MODE_CNTL, BIT(PIPE_NONE), 0, 0, 1, },
  197. { GEN8_TPL1_DBG_ECO_CNTL, BIT(PIPE_NONE), 0, 0, 0, },
  198. { GEN8_TPL1_DBG_ECO_CNTL1, BIT(PIPE_NONE), 0, 0, 0, },
  199. { 0 }
  200. };
  201. static int acd_calibrate_set(void *data, u64 val)
  202. {
  203. struct kgsl_device *device = data;
  204. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  205. struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
  206. u32 debug_val = (u32) val;
  207. int ret;
  208. mutex_lock(&device->mutex);
  209. ret = adreno_active_count_get(adreno_dev);
  210. if (ret)
  211. goto err;
  212. ret = gen8_hfi_send_set_value(adreno_dev, HFI_VALUE_DBG,
  213. F_PWR_ACD_CALIBRATE, debug_val);
  214. if (!ret)
  215. gmu->acd_debug_val = debug_val;
  216. adreno_active_count_put(adreno_dev);
  217. err:
  218. mutex_unlock(&device->mutex);
  219. return ret;
  220. }
  221. static int acd_calibrate_get(void *data, u64 *val)
  222. {
  223. struct kgsl_device *device = data;
  224. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  225. struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
  226. *val = (u64) gmu->acd_debug_val;
  227. return 0;
  228. }
  229. DEFINE_DEBUGFS_ATTRIBUTE(acd_cal_fops, acd_calibrate_get, acd_calibrate_set, "%llu\n");
  230. static ssize_t nc_override_get(struct file *filep,
  231. char __user *user_buf, size_t len, loff_t *off)
  232. {
  233. struct kgsl_device *device = (struct kgsl_device *) filep->private_data;
  234. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  235. struct gen8_device *gen8_dev = container_of(adreno_dev,
  236. struct gen8_device, adreno_dev);
  237. struct gen8_nonctxt_overrides *nc_overrides = gen8_dev->nc_overrides;
  238. u32 i, max_size = PAGE_SIZE;
  239. char *buf, *pos;
  240. ssize_t size = 0;
  241. if (!gen8_dev->nc_overrides_enabled || !nc_overrides)
  242. return 0;
  243. buf = kzalloc(max_size, GFP_KERNEL);
  244. if (!buf)
  245. return -ENOMEM;
  246. pos = buf;
  247. mutex_lock(&gen8_dev->nc_mutex);
  248. /* Copy all assignments from list to str */
  249. for (i = 0; nc_overrides[i].offset; i++) {
  250. if (nc_overrides[i].set) {
  251. len = scnprintf(pos, max_size, "0x%x:0x%8.8x\n",
  252. nc_overrides[i].offset, nc_overrides[i].val);
  253. /* If we run out of space len will be zero */
  254. if (len == 0)
  255. break;
  256. max_size -= len;
  257. pos += len;
  258. }
  259. }
  260. mutex_unlock(&gen8_dev->nc_mutex);
  261. size = simple_read_from_buffer(user_buf, len, off, buf, pos - buf);
  262. kfree(buf);
  263. return size;
  264. }
  265. static void nc_override_cb(struct adreno_device *adreno_dev, void *priv)
  266. {
  267. struct gen8_device *gen8_dev = container_of(adreno_dev, struct gen8_device, adreno_dev);
  268. gen8_dev->nc_overrides_enabled = true;
  269. /* Force to update and make new patched reglist */
  270. adreno_dev->patch_reglist = false;
  271. }
  272. static ssize_t nc_override_set(struct file *filep,
  273. const char __user *user_buf, size_t len, loff_t *off)
  274. {
  275. struct kgsl_device *device = (struct kgsl_device *) filep->private_data;
  276. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  277. struct gen8_device *gen8_dev = container_of(adreno_dev, struct gen8_device, adreno_dev);
  278. struct gen8_nonctxt_overrides *nc_overrides = gen8_dev->nc_overrides;
  279. u32 i, offset, val;
  280. int ret = -EINVAL;
  281. ssize_t size = 0;
  282. char *buf;
  283. if (!nc_overrides)
  284. return 0;
  285. if ((len >= PAGE_SIZE) || (len == 0))
  286. return -EINVAL;
  287. buf = kzalloc(len + 1, GFP_KERNEL);
  288. if (buf == NULL)
  289. return -ENOMEM;
  290. if (copy_from_user(buf, user_buf, len)) {
  291. ret = -EFAULT;
  292. goto err;
  293. }
  294. /* For sanity and parsing, ensure it is null terminated */
  295. buf[len] = '\0';
  296. size = sscanf(buf, "0x%x:0x%x", &offset, &val);
  297. if (size == 0)
  298. goto err;
  299. size = 0;
  300. mutex_lock(&gen8_dev->nc_mutex);
  301. for (i = 0; nc_overrides[i].offset; i++) {
  302. if (nc_overrides[i].offset == offset) {
  303. nc_overrides[i].val = val;
  304. nc_overrides[i].set = true;
  305. size = len;
  306. break;
  307. }
  308. }
  309. mutex_unlock(&gen8_dev->nc_mutex);
  310. if (size > 0) {
  311. ret = adreno_power_cycle(ADRENO_DEVICE(device), nc_override_cb, NULL);
  312. if (!ret)
  313. ret = size;
  314. }
  315. err:
  316. kfree(buf);
  317. return ret;
  318. }
  319. static const struct file_operations nc_override_fops = {
  320. .owner = THIS_MODULE,
  321. .open = simple_open,
  322. .read = nc_override_get,
  323. .write = nc_override_set,
  324. .llseek = noop_llseek,
  325. };
  326. void gen8_cp_init_cmds(struct adreno_device *adreno_dev, u32 *cmds)
  327. {
  328. u32 i = 0, mask = 0;
  329. /* Disable concurrent binning before sending CP init */
  330. cmds[i++] = cp_type7_packet(CP_THREAD_CONTROL, 1);
  331. cmds[i++] = BIT(27);
  332. /* Use multiple HW contexts */
  333. mask |= BIT(0);
  334. /* Enable error detection */
  335. mask |= BIT(1);
  336. /* Set default reset state */
  337. mask |= BIT(3);
  338. /* Disable save/restore of performance counters across preemption */
  339. mask |= BIT(6);
  340. /* Enable the register init list with the spinlock */
  341. mask |= BIT(8);
  342. cmds[i++] = cp_type7_packet(CP_ME_INIT, 7);
  343. /* Enabled ordinal mask */
  344. cmds[i++] = mask;
  345. cmds[i++] = 0x00000003; /* Set number of HW contexts */
  346. cmds[i++] = 0x20000000; /* Enable error detection */
  347. cmds[i++] = 0x00000002; /* Operation mode mask */
  348. /* Register initialization list with spinlock */
  349. cmds[i++] = lower_32_bits(adreno_dev->pwrup_reglist->gpuaddr);
  350. cmds[i++] = upper_32_bits(adreno_dev->pwrup_reglist->gpuaddr);
  351. /*
  352. * Gen8 targets with concurrent binning are expected to have a dynamic
  353. * power up list with triplets which contains the pipe id in it.
  354. * Bit 31 of POWER_UP_REGISTER_LIST_LENGTH is reused here to let CP
  355. * know if the power up contains the triplets. If
  356. * REGISTER_INIT_LIST_WITH_SPINLOCK is set and bit 31 below is set,
  357. * CP expects a dynamic list with triplets.
  358. */
  359. cmds[i++] = BIT(31);
  360. }
  361. int gen8_fenced_write(struct adreno_device *adreno_dev, u32 offset,
  362. u32 value, u32 mask)
  363. {
  364. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  365. const struct adreno_gpudev *gpudev = ADRENO_GPU_DEVICE(adreno_dev);
  366. u32 status, i;
  367. u64 ts1, ts2;
  368. kgsl_regwrite(device, offset, value);
  369. ts1 = gpudev->read_alwayson(adreno_dev);
  370. for (i = 0; i < GMU_CORE_LONG_WAKEUP_RETRY_LIMIT; i++) {
  371. /*
  372. * Make sure the previous register write is posted before
  373. * checking the fence status
  374. */
  375. mb();
  376. gmu_core_regread(device, GEN8_GMUAO_AHB_FENCE_STATUS, &status);
  377. /*
  378. * If !writedropped0/1, then the write to fenced register
  379. * was successful
  380. */
  381. if (!(status & mask))
  382. break;
  383. /* Wait a small amount of time before trying again */
  384. udelay(GMU_CORE_WAKEUP_DELAY_US);
  385. /* Try to write the fenced register again */
  386. kgsl_regwrite(device, offset, value);
  387. }
  388. if (i < GMU_CORE_SHORT_WAKEUP_RETRY_LIMIT)
  389. return 0;
  390. if (i == GMU_CORE_LONG_WAKEUP_RETRY_LIMIT) {
  391. ts2 = gpudev->read_alwayson(adreno_dev);
  392. dev_err(device->dev,
  393. "Timed out waiting %d usecs to write fenced register 0x%x, timestamps: %llx %llx\n",
  394. i * GMU_CORE_WAKEUP_DELAY_US, offset, ts1, ts2);
  395. return -ETIMEDOUT;
  396. }
  397. dev_info(device->dev,
  398. "Waited %d usecs to write fenced register 0x%x\n",
  399. i * GMU_CORE_WAKEUP_DELAY_US, offset);
  400. return 0;
  401. }
  402. int gen8_init(struct adreno_device *adreno_dev)
  403. {
  404. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  405. struct gen8_device *gen8_dev = container_of(adreno_dev,
  406. struct gen8_device, adreno_dev);
  407. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  408. u64 freq = gen8_core->gmu_hub_clk_freq;
  409. adreno_dev->highest_bank_bit = gen8_core->highest_bank_bit;
  410. adreno_dev->gmu_hub_clk_freq = freq ? freq : 150000000;
  411. adreno_dev->ahb_timeout_val = adreno_get_ahb_timeout_val(adreno_dev,
  412. gen8_core->noc_timeout_us);
  413. adreno_dev->bcl_data = gen8_core->bcl_data;
  414. adreno_dev->cooperative_reset = ADRENO_FEATURE(adreno_dev,
  415. ADRENO_COOP_RESET);
  416. /* If the memory type is DDR 4, override the existing configuration */
  417. if (of_fdt_get_ddrtype() == 0x7)
  418. adreno_dev->highest_bank_bit = 14;
  419. gen8_crashdump_init(adreno_dev);
  420. gen8_dev->nc_overrides = gen8_nc_overrides;
  421. mutex_init(&gen8_dev->nc_mutex);
  422. /* Debugfs node for noncontext registers override */
  423. debugfs_create_file("nc_override", 0644, device->d_debugfs, device, &nc_override_fops);
  424. return adreno_allocate_global(device, &adreno_dev->pwrup_reglist,
  425. PAGE_SIZE, 0, 0, KGSL_MEMDESC_PRIVILEGED,
  426. "powerup_register_list");
  427. }
  428. #define CX_TIMER_INIT_SAMPLES 16
  429. void gen8_cx_timer_init(struct adreno_device *adreno_dev)
  430. {
  431. u64 seed_val, tmr, skew = 0;
  432. int i;
  433. unsigned long flags;
  434. /* Set it up during first boot or after suspend resume */
  435. if (test_bit(ADRENO_DEVICE_CX_TIMER_INITIALIZED, &adreno_dev->priv))
  436. return;
  437. /* Disable irqs to get accurate timings */
  438. local_irq_save(flags);
  439. /* Calculate the overhead of timer reads and register writes */
  440. for (i = 0; i < CX_TIMER_INIT_SAMPLES; i++) {
  441. u64 tmr1, tmr2, tmr3;
  442. /* Measure time for two reads of the CPU timer */
  443. tmr1 = arch_timer_read_counter();
  444. tmr2 = arch_timer_read_counter();
  445. /* Write to the register and time it */
  446. adreno_cx_misc_regwrite(adreno_dev,
  447. GEN8_GPU_CX_MISC_AO_COUNTER_LO,
  448. lower_32_bits(tmr2));
  449. adreno_cx_misc_regwrite(adreno_dev,
  450. GEN8_GPU_CX_MISC_AO_COUNTER_HI,
  451. upper_32_bits(tmr2));
  452. /* Barrier to make sure the write completes before timing it */
  453. mb();
  454. tmr3 = arch_timer_read_counter();
  455. /* Calculate difference between register write and CPU timer */
  456. skew += (tmr3 - tmr2) - (tmr2 - tmr1);
  457. }
  458. local_irq_restore(flags);
  459. /* Get the average over all our readings, to the closest integer */
  460. skew = (skew + CX_TIMER_INIT_SAMPLES / 2) / CX_TIMER_INIT_SAMPLES;
  461. local_irq_save(flags);
  462. tmr = arch_timer_read_counter();
  463. seed_val = tmr + skew;
  464. /* Seed the GPU CX counter with the adjusted timer */
  465. adreno_cx_misc_regwrite(adreno_dev,
  466. GEN8_GPU_CX_MISC_AO_COUNTER_LO, lower_32_bits(seed_val));
  467. adreno_cx_misc_regwrite(adreno_dev,
  468. GEN8_GPU_CX_MISC_AO_COUNTER_HI, upper_32_bits(seed_val));
  469. local_irq_restore(flags);
  470. set_bit(ADRENO_DEVICE_CX_TIMER_INITIALIZED, &adreno_dev->priv);
  471. }
  472. void gen8_get_gpu_feature_info(struct adreno_device *adreno_dev)
  473. {
  474. u32 feature_fuse = 0;
  475. /* Get HW feature soft fuse value */
  476. adreno_cx_misc_regread(adreno_dev, GEN8_GPU_CX_MISC_SW_FUSE_VALUE,
  477. &feature_fuse);
  478. adreno_dev->fastblend_enabled = feature_fuse & BIT(GEN8_FASTBLEND_SW_FUSE);
  479. adreno_dev->raytracing_enabled = feature_fuse & BIT(GEN8_RAYTRACING_SW_FUSE);
  480. /* If software enables LPAC without HW support, disable it */
  481. if (ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  482. adreno_dev->lpac_enabled = feature_fuse & BIT(GEN8_LPAC_SW_FUSE);
  483. adreno_dev->feature_fuse = feature_fuse;
  484. }
  485. void gen8_host_aperture_set(struct adreno_device *adreno_dev, u32 pipe_id,
  486. u32 slice_id, u32 use_slice_id)
  487. {
  488. struct gen8_device *gen8_dev = container_of(adreno_dev,
  489. struct gen8_device, adreno_dev);
  490. u32 aperture_val = (FIELD_PREP(GENMASK(15, 12), pipe_id) |
  491. FIELD_PREP(GENMASK(18, 16), slice_id) |
  492. FIELD_PREP(GENMASK(23, 23), use_slice_id));
  493. /* Check if we already set the aperture */
  494. if (gen8_dev->aperture == aperture_val)
  495. return;
  496. kgsl_regwrite(KGSL_DEVICE(adreno_dev), GEN8_CP_APERTURE_CNTL_HOST, aperture_val);
  497. /* Make sure the aperture write goes through before reading the registers */
  498. mb();
  499. gen8_dev->aperture = aperture_val;
  500. }
  501. void gen8_regread64_aperture(struct kgsl_device *device,
  502. u32 offsetwords_lo, u32 offsetwords_hi, u64 *value, u32 pipe,
  503. u32 slice_id, u32 use_slice_id)
  504. {
  505. u32 val_lo = 0, val_hi = 0;
  506. gen8_host_aperture_set(ADRENO_DEVICE(device), pipe, slice_id, use_slice_id);
  507. val_lo = kgsl_regmap_read(&device->regmap, offsetwords_lo);
  508. val_hi = kgsl_regmap_read(&device->regmap, offsetwords_hi);
  509. *value = (((u64)val_hi << 32) | val_lo);
  510. }
  511. void gen8_regread_aperture(struct kgsl_device *device,
  512. u32 offsetwords, u32 *value, u32 pipe, u32 slice_id, u32 use_slice_id)
  513. {
  514. gen8_host_aperture_set(ADRENO_DEVICE(device), pipe, slice_id, use_slice_id);
  515. *value = kgsl_regmap_read(&device->regmap, offsetwords);
  516. }
  517. static inline void gen8_regwrite_aperture(struct kgsl_device *device,
  518. u32 offsetwords, u32 value, u32 pipe, u32 slice_id, u32 use_slice_id)
  519. {
  520. gen8_host_aperture_set(ADRENO_DEVICE(device), pipe, slice_id, use_slice_id);
  521. kgsl_regmap_write(&device->regmap, value, offsetwords);
  522. }
  523. #define GEN8_CP_PROTECT_DEFAULT (FIELD_PREP(GENMASK(31, 16), 0xffff) | BIT(0) | BIT(1) | BIT(3))
  524. static void gen8_protect_init(struct adreno_device *adreno_dev)
  525. {
  526. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  527. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  528. const struct gen8_protected_regs *regs = gen8_core->protected_regs;
  529. u32 count = 0;
  530. int i;
  531. /*
  532. * Enable access protection to privileged registers, fault on an access
  533. * protect violation and select the last span to protect from the start
  534. * address all the way to the end of the register address space
  535. */
  536. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_CNTL_PIPE,
  537. GEN8_CP_PROTECT_DEFAULT, PIPE_BR, 0, 0);
  538. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_CNTL_PIPE,
  539. GEN8_CP_PROTECT_DEFAULT, PIPE_BV, 0, 0);
  540. if (adreno_dev->lpac_enabled)
  541. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_CNTL_PIPE,
  542. GEN8_CP_PROTECT_DEFAULT, PIPE_LPAC, 0, 0);
  543. /* Clear aperture register */
  544. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  545. /* Program each register defined by the core definition */
  546. for (i = 0; regs[i].reg; i++) {
  547. /*
  548. * This is the offset of the end register as counted from the
  549. * start, i.e. # of registers in the range - 1
  550. */
  551. count = regs[i].end - regs[i].start;
  552. kgsl_regwrite(device, regs[i].reg,
  553. FIELD_PREP(GENMASK(17, 0), regs[i].start) |
  554. FIELD_PREP(GENMASK(30, 18), count) |
  555. FIELD_PREP(BIT(31), regs[i].noaccess));
  556. }
  557. /*
  558. * Last span setting is only being applied to the last pipe specific
  559. * register. Hence duplicate the last span from protect reg into the
  560. * BR, BV and LPAC protect reg pipe 15.
  561. */
  562. i--;
  563. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_REG_PIPE + 15,
  564. FIELD_PREP(GENMASK(17, 0), regs[i].start) |
  565. FIELD_PREP(GENMASK(30, 18), count) |
  566. FIELD_PREP(BIT(31), regs[i].noaccess),
  567. PIPE_BR, 0, 0);
  568. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_REG_PIPE + 15,
  569. FIELD_PREP(GENMASK(17, 0), regs[i].start) |
  570. FIELD_PREP(GENMASK(30, 18), count) |
  571. FIELD_PREP(BIT(31), regs[i].noaccess),
  572. PIPE_BV, 0, 0);
  573. if (adreno_dev->lpac_enabled)
  574. gen8_regwrite_aperture(device, GEN8_CP_PROTECT_REG_PIPE + 15,
  575. FIELD_PREP(GENMASK(17, 0), regs[i].start) |
  576. FIELD_PREP(GENMASK(30, 18), count) |
  577. FIELD_PREP(BIT(31), regs[i].noaccess),
  578. PIPE_LPAC, 0, 0);
  579. /* Clear aperture register */
  580. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  581. }
  582. static void gen8_nonctxt_regconfig(struct adreno_device *adreno_dev)
  583. {
  584. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  585. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  586. const struct gen8_nonctxt_regs *regs = gen8_core->nonctxt_regs;
  587. struct gen8_device *gen8_dev = container_of(adreno_dev,
  588. struct gen8_device, adreno_dev);
  589. u32 i, pipe_id;
  590. unsigned long pipe;
  591. /* Program non context registers for all pipes */
  592. for (pipe_id = PIPE_NONE; pipe_id <= PIPE_AQE1; pipe_id++) {
  593. if ((pipe_id == PIPE_LPAC) && !ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  594. continue;
  595. else if (((pipe_id == PIPE_AQE0) || (pipe_id == PIPE_AQE1)) &&
  596. !ADRENO_FEATURE(adreno_dev, ADRENO_AQE))
  597. continue;
  598. for (i = 0; regs[i].offset; i++) {
  599. pipe = (unsigned long)regs[i].pipelines;
  600. if (test_bit(pipe_id, &pipe))
  601. gen8_regwrite_aperture(device, regs[i].offset,
  602. regs[i].val, pipe_id, 0, 0);
  603. }
  604. }
  605. /* Program non context registers overrides for all pipes */
  606. if (gen8_dev->nc_overrides_enabled) {
  607. struct gen8_nonctxt_overrides *nc_overrides = gen8_dev->nc_overrides;
  608. mutex_lock(&gen8_dev->nc_mutex);
  609. for (pipe_id = PIPE_NONE; pipe_id <= PIPE_AQE1; pipe_id++) {
  610. if ((pipe_id == PIPE_LPAC) && !ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  611. continue;
  612. else if (((pipe_id == PIPE_AQE0) || (pipe_id == PIPE_AQE1)) &&
  613. !ADRENO_FEATURE(adreno_dev, ADRENO_AQE))
  614. continue;
  615. for (i = 0; nc_overrides[i].offset; i++) {
  616. if (!nc_overrides[i].set)
  617. continue;
  618. pipe = (unsigned long)nc_overrides[i].pipelines;
  619. if (test_bit(pipe_id, &pipe))
  620. gen8_regwrite_aperture(device, nc_overrides[i].offset,
  621. nc_overrides[i].val, pipe_id, 0, 0);
  622. }
  623. }
  624. mutex_unlock(&gen8_dev->nc_mutex);
  625. }
  626. /* Clear aperture register */
  627. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  628. }
  629. #define RBBM_CLOCK_CNTL_ON 0x8aa8aa82
  630. static void gen8_hwcg_set(struct adreno_device *adreno_dev, bool on)
  631. {
  632. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  633. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  634. u32 value;
  635. int i;
  636. /* Increase clock keep-on hysteresis from 5 cycles to 8 cycles */
  637. if (!adreno_is_gen8_3_0(adreno_dev) && on)
  638. kgsl_regwrite(device, GEN8_RBBM_CGC_0_PC, 0x00000702);
  639. if (!adreno_dev->hwcg_enabled)
  640. on = false;
  641. for (i = 0; i < gen8_core->ao_hwcg_count; i++)
  642. gmu_core_regwrite(device, gen8_core->ao_hwcg[i].offset,
  643. on ? gen8_core->ao_hwcg[i].val : 0);
  644. kgsl_regwrite(device, GEN8_RBBM_CLOCK_CNTL_GLOBAL, 1);
  645. kgsl_regwrite(device, GEN8_RBBM_CGC_GLOBAL_LOAD_CMD, on ? 1 : 0);
  646. if (on) {
  647. u32 retry = 3;
  648. kgsl_regwrite(device, GEN8_RBBM_CGC_P2S_TRIG_CMD, 1);
  649. /* Poll for the TXDONE:BIT(0) status */
  650. do {
  651. /* Wait for small amount of time for TXDONE status*/
  652. udelay(1);
  653. kgsl_regread(device, GEN8_RBBM_CGC_P2S_STATUS, &value);
  654. } while (!(value & BIT(0)) && --retry);
  655. if (!(value & BIT(0))) {
  656. dev_err(device->dev, "RBBM_CGC_P2S_STATUS:TXDONE Poll failed\n");
  657. kgsl_device_snapshot(device, NULL, NULL, false);
  658. return;
  659. }
  660. kgsl_regwrite(device, GEN8_RBBM_CLOCK_CNTL_GLOBAL, 0);
  661. }
  662. }
  663. static void gen8_patch_pwrup_reglist(struct adreno_device *adreno_dev)
  664. {
  665. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  666. struct gen8_device *gen8_dev = container_of(adreno_dev,
  667. struct gen8_device, adreno_dev);
  668. struct adreno_reglist_list reglist[3];
  669. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  670. struct cpu_gpu_lock *lock = ptr;
  671. u32 items = 0, i, j, pipe_id;
  672. u32 *dest = ptr + sizeof(*lock);
  673. struct gen8_nonctxt_overrides *nc_overrides = gen8_dev->nc_overrides;
  674. /* Static IFPC restore only registers */
  675. reglist[items].regs = gen8_3_0_ifpc_pwrup_reglist;
  676. reglist[items].count = ARRAY_SIZE(gen8_3_0_ifpc_pwrup_reglist);
  677. lock->ifpc_list_len = reglist[items].count;
  678. items++;
  679. /* Static IFPC + preemption registers */
  680. reglist[items].regs = gen8_3_0_pwrup_reglist;
  681. reglist[items].count = ARRAY_SIZE(gen8_3_0_pwrup_reglist);
  682. lock->preemption_list_len = reglist[items].count;
  683. items++;
  684. /*
  685. * For each entry in each of the lists, write the offset and the current
  686. * register value into the GPU buffer
  687. */
  688. for (i = 0; i < items; i++) {
  689. const u32 *r = reglist[i].regs;
  690. for (j = 0; j < reglist[i].count; j++) {
  691. *dest++ = r[j];
  692. kgsl_regread(device, r[j], dest++);
  693. }
  694. mutex_lock(&gen8_dev->nc_mutex);
  695. for (j = 0; j < nc_overrides[j].offset; j++) {
  696. unsigned long pipe = (unsigned long)nc_overrides[j].pipelines;
  697. if (!(test_bit(PIPE_NONE, &pipe) && nc_overrides[j].set &&
  698. nc_overrides[j].list_type))
  699. continue;
  700. if ((reglist[i].regs == gen8_3_0_ifpc_pwrup_reglist) &&
  701. (nc_overrides[j].list_type == 1)) {
  702. *dest++ = nc_overrides[j].offset;
  703. kgsl_regread(device, nc_overrides[j].offset, dest++);
  704. lock->ifpc_list_len++;
  705. } else if ((reglist[i].regs == gen8_3_0_pwrup_reglist) &&
  706. (nc_overrides[j].list_type == 2)) {
  707. *dest++ = nc_overrides[j].offset;
  708. kgsl_regread(device, nc_overrides[j].offset, dest++);
  709. lock->preemption_list_len++;
  710. }
  711. }
  712. mutex_unlock(&gen8_dev->nc_mutex);
  713. }
  714. /*
  715. * The overall register list is composed of
  716. * 1. Static IFPC-only registers
  717. * 2. Static IFPC + preemption registers
  718. * 3. Dynamic IFPC + preemption registers (ex: perfcounter selects)
  719. *
  720. * The first two lists are static. Size of these lists are stored as
  721. * number of pairs in ifpc_list_len and preemption_list_len
  722. * respectively. With concurrent binning, Some of the perfcounter
  723. * registers being virtualized, CP needs to know the pipe id to program
  724. * the aperture inorder to restore the same. Thus, third list is a
  725. * dynamic list with triplets as
  726. * (<aperture, shifted 12 bits> <address> <data>), and the length is
  727. * stored as number for triplets in dynamic_list_len.
  728. *
  729. * Starting with Gen8, some of the registers that are initialized statically
  730. * by the kernel are pipe-specific. Because only the dynamic list is able to
  731. * support specifying a pipe ID, these registers are bundled along with any
  732. * dynamic entries such as perf counter selects into a single dynamic list.
  733. */
  734. gen8_dev->ext_pwrup_list_len = 0;
  735. /*
  736. * Write external pipe specific regs (<aperture> <address> <value> - triplets)
  737. * offset and the current value into GPU buffer
  738. */
  739. for (pipe_id = PIPE_BR; pipe_id <= PIPE_LPAC; pipe_id++) {
  740. for (i = 0; i < ARRAY_SIZE(gen8_3_0_pwrup_extlist); i++) {
  741. unsigned long pipe = (unsigned long)gen8_3_0_pwrup_extlist[i].pipelines;
  742. if (!test_bit(pipe_id, &pipe))
  743. continue;
  744. *dest++ = FIELD_PREP(GENMASK(15, 12), pipe_id);
  745. *dest++ = gen8_3_0_pwrup_extlist[i].offset;
  746. gen8_regread_aperture(device, gen8_3_0_pwrup_extlist[i].offset,
  747. dest++, pipe_id, 0, 0);
  748. gen8_dev->ext_pwrup_list_len++;
  749. }
  750. }
  751. /*
  752. * Write noncontext override pipe specific regs (<aperture> <address> <value> - triplets)
  753. * offset and the current value into GPU buffer
  754. */
  755. mutex_lock(&gen8_dev->nc_mutex);
  756. for (pipe_id = PIPE_BR; pipe_id <= PIPE_BV; pipe_id++) {
  757. for (i = 0; i < nc_overrides[i].offset; i++) {
  758. unsigned long pipe = (unsigned long)nc_overrides[i].pipelines;
  759. if (!(test_bit(pipe_id, &pipe) && nc_overrides[i].set &&
  760. nc_overrides[i].list_type))
  761. continue;
  762. *dest++ = FIELD_PREP(GENMASK(15, 12), pipe_id);
  763. *dest++ = nc_overrides[i].offset;
  764. gen8_regread_aperture(device, nc_overrides[i].offset,
  765. dest++, pipe_id, 0, 0);
  766. gen8_dev->ext_pwrup_list_len++;
  767. }
  768. }
  769. mutex_unlock(&gen8_dev->nc_mutex);
  770. /* Clear aperture register */
  771. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  772. lock->dynamic_list_len = gen8_dev->ext_pwrup_list_len;
  773. }
  774. /* _llc_configure_gpu_scid() - Program the sub-cache ID for all GPU blocks */
  775. static void _llc_configure_gpu_scid(struct adreno_device *adreno_dev)
  776. {
  777. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  778. u32 gpu_scid;
  779. if (IS_ERR_OR_NULL(adreno_dev->gpu_llc_slice) ||
  780. !adreno_dev->gpu_llc_slice_enable)
  781. return;
  782. if (llcc_slice_activate(adreno_dev->gpu_llc_slice))
  783. return;
  784. gpu_scid = llcc_get_slice_id(adreno_dev->gpu_llc_slice);
  785. /* 5 blocks at 6 bits per block */
  786. kgsl_regwrite(device, GEN8_GBIF_SCACHE_CNTL1,
  787. FIELD_PREP(GENMASK(29, 24), gpu_scid) |
  788. FIELD_PREP(GENMASK(23, 18), gpu_scid) |
  789. FIELD_PREP(GENMASK(17, 12), gpu_scid) |
  790. FIELD_PREP(GENMASK(11, 6), gpu_scid) |
  791. FIELD_PREP(GENMASK(5, 0), gpu_scid));
  792. kgsl_regwrite(device, GEN8_GBIF_SCACHE_CNTL0,
  793. FIELD_PREP(GENMASK(15, 10), gpu_scid) |
  794. FIELD_PREP(GENMASK(21, 16), gpu_scid) |
  795. FIELD_PREP(GENMASK(27, 22), gpu_scid) | BIT(8));
  796. }
  797. static void _llc_gpuhtw_slice_activate(struct adreno_device *adreno_dev)
  798. {
  799. if (IS_ERR_OR_NULL(adreno_dev->gpuhtw_llc_slice) ||
  800. !adreno_dev->gpuhtw_llc_slice_enable)
  801. return;
  802. llcc_slice_activate(adreno_dev->gpuhtw_llc_slice);
  803. }
  804. static void _set_secvid(struct kgsl_device *device)
  805. {
  806. kgsl_regwrite(device, GEN8_RBBM_SECVID_TSB_CNTL, 0x0);
  807. kgsl_regwrite(device, GEN8_RBBM_SECVID_TSB_TRUSTED_BASE_LO,
  808. lower_32_bits(KGSL_IOMMU_SECURE_BASE32));
  809. kgsl_regwrite(device, GEN8_RBBM_SECVID_TSB_TRUSTED_BASE_HI,
  810. upper_32_bits(KGSL_IOMMU_SECURE_BASE32));
  811. kgsl_regwrite(device, GEN8_RBBM_SECVID_TSB_TRUSTED_SIZE,
  812. FIELD_PREP(GENMASK(31, 12),
  813. (KGSL_IOMMU_SECURE_SIZE(&device->mmu) / SZ_4K)));
  814. }
  815. /* Set UCHE_TRAP_BASE to a page below the top of the memory space */
  816. #define GEN8_UCHE_TRAP_BASE 0x1FFFFFFFFF000ULL
  817. static u64 gen8_get_uche_trap_base(void)
  818. {
  819. return GEN8_UCHE_TRAP_BASE;
  820. }
  821. /*
  822. * All Gen8 targets support marking certain transactions as always privileged
  823. * which allows us to mark more memory as privileged without having to
  824. * explicitly set the APRIV bit. Choose the following transactions to be
  825. * privileged by default:
  826. * CDWRITE [6:6] - Crashdumper writes
  827. * CDREAD [5:5] - Crashdumper reads
  828. * RBRPWB [3:3] - RPTR shadow writes
  829. * RBPRIVLEVEL [2:2] - Memory accesses from PM4 packets in the ringbuffer
  830. * RBFETCH [1:1] - Ringbuffer reads
  831. * ICACHE [0:0] - Instruction cache fetches
  832. */
  833. #define GEN8_APRIV_DEFAULT (BIT(3) | BIT(2) | BIT(1) | BIT(0))
  834. /* Add crashdumper permissions for the BR APRIV */
  835. #define GEN8_BR_APRIV_DEFAULT (GEN8_APRIV_DEFAULT | BIT(6) | BIT(5))
  836. static const struct kgsl_regmap_list gen8_3_0_bicubic_regs[] = {
  837. /*GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_0 default and recomended values are same */
  838. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_1, 0x3fe05ff4 },
  839. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_2, 0x3fa0ebee },
  840. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_3, 0x3f5193ed },
  841. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_4, 0x3f0243f0 },
  842. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_5, 0x00000000 },
  843. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_6, 0x3fd093e8 },
  844. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_7, 0x3f4133dc },
  845. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_8, 0x3ea1dfdb },
  846. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_9, 0x3e0283e0 },
  847. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_10, 0x0000ac2b },
  848. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_11, 0x0000f01d },
  849. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_12, 0x00114412 },
  850. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_13, 0x0021980a },
  851. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_14, 0x0051ec05 },
  852. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_15, 0x0000380e },
  853. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_16, 0x3ff09001 },
  854. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_17, 0x3fc10bfa },
  855. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_18, 0x3f9193f7 },
  856. { GEN8_TPL1_BICUBIC_WEIGHTS_TABLE_19, 0x3f7227f7 },
  857. };
  858. void gen8_enable_ahb_timeout_detection(struct adreno_device *adreno_dev)
  859. {
  860. u32 val;
  861. if (!adreno_dev->ahb_timeout_val)
  862. return;
  863. val = (ADRENO_AHB_CNTL_DEFAULT | FIELD_PREP(GENMASK(4, 0),
  864. adreno_dev->ahb_timeout_val));
  865. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_CX_AHB_AON_CNTL, val);
  866. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_CX_AHB_GMU_CNTL, val);
  867. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_CX_AHB_CP_CNTL, val);
  868. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_CX_AHB_VBIF_SMMU_CNTL, val);
  869. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_CX_AHB_HOST_CNTL, val);
  870. }
  871. #define MIN_HBB 13
  872. int gen8_start(struct adreno_device *adreno_dev)
  873. {
  874. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  875. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  876. u32 mal, mode = 0, mode2 = 0, rgb565_predicator = 0, amsbc = 0;
  877. struct gen8_device *gen8_dev = container_of(adreno_dev,
  878. struct gen8_device, adreno_dev);
  879. /*
  880. * HBB values 13 to 16 can represented LSB of HBB from 0 to 3.
  881. * Any HBB value beyond 16 needs programming MSB of HBB.
  882. * By default highest bank bit is 14, Hence set default HBB LSB
  883. * to "1" and MSB to "0".
  884. */
  885. u32 hbb_lo = 1, hbb_hi = 0, hbb = 1;
  886. struct cpu_gpu_lock *pwrup_lock = adreno_dev->pwrup_reglist->hostptr;
  887. u64 uche_trap_base = gen8_get_uche_trap_base();
  888. u32 rgba8888_lossless = 0, fp16compoptdis = 0;
  889. /* Reset aperture fields to go through first aperture write check */
  890. gen8_dev->aperture = UINT_MAX;
  891. /* Make all blocks contribute to the GPU BUSY perf counter */
  892. kgsl_regwrite(device, GEN8_RBBM_PERFCTR_GPU_BUSY_MASKED, 0xffffffff);
  893. kgsl_regwrite(device, GEN8_UCHE_CCHE_GC_GMEM_RANGE_MIN_LO,
  894. lower_32_bits(adreno_dev->uche_gmem_base));
  895. kgsl_regwrite(device, GEN8_UCHE_CCHE_GC_GMEM_RANGE_MIN_HI,
  896. upper_32_bits(adreno_dev->uche_gmem_base));
  897. kgsl_regwrite(device, GEN8_SP_HLSQ_GC_GMEM_RANGE_MIN_LO,
  898. lower_32_bits(adreno_dev->uche_gmem_base));
  899. kgsl_regwrite(device, GEN8_SP_HLSQ_GC_GMEM_RANGE_MIN_HI,
  900. upper_32_bits(adreno_dev->uche_gmem_base));
  901. if (adreno_dev->lpac_enabled) {
  902. gen8_regwrite_aperture(device, GEN8_RB_LPAC_GMEM_PROTECT,
  903. 0x0c000000, PIPE_BR, 0, 0);
  904. /* Clear aperture register */
  905. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  906. kgsl_regwrite(device, GEN8_UCHE_CCHE_LPAC_GMEM_RANGE_MIN_LO,
  907. lower_32_bits(adreno_dev->uche_gmem_base));
  908. kgsl_regwrite(device, GEN8_UCHE_CCHE_LPAC_GMEM_RANGE_MIN_HI,
  909. upper_32_bits(adreno_dev->uche_gmem_base));
  910. kgsl_regwrite(device, GEN8_SP_HLSQ_LPAC_GMEM_RANGE_MIN_LO,
  911. lower_32_bits(adreno_dev->uche_gmem_base));
  912. kgsl_regwrite(device, GEN8_SP_HLSQ_LPAC_GMEM_RANGE_MIN_HI,
  913. upper_32_bits(adreno_dev->uche_gmem_base));
  914. }
  915. /*
  916. * Set UCHE_WRITE_THRU_BASE to the UCHE_TRAP_BASE effectively
  917. * disabling L2 bypass
  918. */
  919. kgsl_regwrite(device, GEN8_UCHE_TRAP_BASE_LO, lower_32_bits(uche_trap_base));
  920. kgsl_regwrite(device, GEN8_UCHE_TRAP_BASE_HI, upper_32_bits(uche_trap_base));
  921. kgsl_regwrite(device, GEN8_UCHE_WRITE_THRU_BASE_LO, lower_32_bits(uche_trap_base));
  922. kgsl_regwrite(device, GEN8_UCHE_WRITE_THRU_BASE_HI, upper_32_bits(uche_trap_base));
  923. /*
  924. * CP takes care of the restore during IFPC exit. We need to restore at slumber
  925. * boundary as well
  926. */
  927. if (pwrup_lock->dynamic_list_len - gen8_dev->ext_pwrup_list_len > 0) {
  928. kgsl_regwrite(device, GEN8_RBBM_PERFCTR_CNTL, 0x1);
  929. kgsl_regwrite(device, GEN8_RBBM_SLICE_PERFCTR_CNTL, 0x1);
  930. }
  931. /* Turn on the IFPC counter (countable 4 on XOCLK4) */
  932. kgsl_regwrite(device, GEN8_GMUCX_POWER_COUNTER_SELECT_XOCLK_1,
  933. FIELD_PREP(GENMASK(7, 0), 0x4));
  934. /* Turn on counter to count total time spent in BCL throttle */
  935. if (adreno_dev->bcl_enabled)
  936. kgsl_regrmw(device, GEN8_GMUCX_POWER_COUNTER_SELECT_XOCLK_1, GENMASK(15, 8),
  937. FIELD_PREP(GENMASK(15, 8), 0x26));
  938. if (of_property_read_u32(device->pdev->dev.of_node, "qcom,min-access-length", &mal))
  939. mal = 32;
  940. of_property_read_u32(device->pdev->dev.of_node, "qcom,ubwc-mode", &mode);
  941. switch (mode) {
  942. case KGSL_UBWC_5_0:
  943. amsbc = 1;
  944. rgb565_predicator = 1;
  945. mode2 = 4;
  946. break;
  947. case KGSL_UBWC_4_0:
  948. amsbc = 1;
  949. rgb565_predicator = 1;
  950. fp16compoptdis = 1;
  951. rgba8888_lossless = 1;
  952. mode2 = 2;
  953. break;
  954. case KGSL_UBWC_3_0:
  955. amsbc = 1;
  956. mode2 = 1;
  957. break;
  958. default:
  959. break;
  960. }
  961. if (!WARN_ON(!adreno_dev->highest_bank_bit)) {
  962. hbb = adreno_dev->highest_bank_bit - MIN_HBB;
  963. hbb_lo = hbb & 3;
  964. hbb_hi = (hbb >> 2) & 1;
  965. }
  966. mal = (mal == 64) ? 1 : 0;
  967. gen8_regwrite_aperture(device, GEN8_GRAS_NC_MODE_CNTL,
  968. FIELD_PREP(GENMASK(8, 5), hbb), PIPE_BV, 0, 0);
  969. gen8_regwrite_aperture(device, GEN8_GRAS_NC_MODE_CNTL,
  970. FIELD_PREP(GENMASK(8, 5), hbb), PIPE_BR, 0, 0);
  971. gen8_regwrite_aperture(device, GEN8_RB_CCU_NC_MODE_CNTL,
  972. FIELD_PREP(GENMASK(3, 3), hbb_hi) |
  973. FIELD_PREP(GENMASK(2, 1), hbb_lo),
  974. PIPE_BR, 0, 0);
  975. gen8_regwrite_aperture(device, GEN8_RB_CMP_NC_MODE_CNTL,
  976. FIELD_PREP(GENMASK(17, 15), mode2) |
  977. FIELD_PREP(GENMASK(4, 4), rgba8888_lossless) |
  978. FIELD_PREP(GENMASK(3, 3), fp16compoptdis) |
  979. FIELD_PREP(GENMASK(2, 2), rgb565_predicator) |
  980. FIELD_PREP(GENMASK(1, 1), amsbc) |
  981. FIELD_PREP(GENMASK(0, 0), mal),
  982. PIPE_BR, 0, 0);
  983. /* Clear aperture register */
  984. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  985. kgsl_regwrite(device, GEN8_SP_NC_MODE_CNTL,
  986. FIELD_PREP(GENMASK(11, 10), hbb_hi) |
  987. FIELD_PREP(GENMASK(5, 4), 2) |
  988. FIELD_PREP(GENMASK(3, 3), mal) |
  989. FIELD_PREP(GENMASK(2, 1), hbb_lo));
  990. kgsl_regwrite(device, GEN8_TPL1_NC_MODE_CNTL,
  991. FIELD_PREP(GENMASK(4, 4), hbb_hi) |
  992. FIELD_PREP(GENMASK(3, 3), mal) |
  993. FIELD_PREP(GENMASK(2, 1), hbb_lo));
  994. /* Configure TP bicubic registers */
  995. kgsl_regmap_multi_write(&device->regmap, gen8_3_0_bicubic_regs,
  996. ARRAY_SIZE(gen8_3_0_bicubic_regs));
  997. /* Program noncontext registers */
  998. gen8_nonctxt_regconfig(adreno_dev);
  999. /* Enable hardware hang detection */
  1000. kgsl_regwrite(device, GEN8_RBBM_INTERFACE_HANG_INT_CNTL, BIT(30) |
  1001. FIELD_PREP(GENMASK(27, 0), gen8_core->hang_detect_cycles));
  1002. kgsl_regwrite(device, GEN8_RBBM_SLICE_INTERFACE_HANG_INT_CNTL, BIT(30));
  1003. kgsl_regwrite(device, GEN8_UCHE_CLIENT_PF, BIT(7) |
  1004. FIELD_PREP(GENMASK(6, 0), adreno_dev->uche_client_pf));
  1005. /* Enable the GMEM save/restore feature for preemption */
  1006. if (adreno_is_preemption_enabled(adreno_dev)) {
  1007. gen8_regwrite_aperture(device,
  1008. GEN8_RB_CONTEXT_SWITCH_GMEM_SAVE_RESTORE,
  1009. 0x1, PIPE_BR, 0, 0);
  1010. /* Clear aperture register */
  1011. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  1012. }
  1013. /* Enable GMU power counter 0 to count GPU busy */
  1014. kgsl_regwrite(device, GEN8_GMUAO_GPU_CX_BUSY_MASK, 0xff000000);
  1015. kgsl_regrmw(device, GEN8_GMUCX_POWER_COUNTER_SELECT_XOCLK_0, 0xFF, 0x20);
  1016. kgsl_regwrite(device, GEN8_GMUCX_POWER_COUNTER_ENABLE, 0x1);
  1017. gen8_protect_init(adreno_dev);
  1018. /* Configure LLCC */
  1019. _llc_configure_gpu_scid(adreno_dev);
  1020. _llc_gpuhtw_slice_activate(adreno_dev);
  1021. gen8_regwrite_aperture(device, GEN8_CP_APRIV_CNTL_PIPE,
  1022. GEN8_BR_APRIV_DEFAULT, PIPE_BR, 0, 0);
  1023. gen8_regwrite_aperture(device, GEN8_CP_APRIV_CNTL_PIPE,
  1024. GEN8_APRIV_DEFAULT, PIPE_BV, 0, 0);
  1025. if (adreno_dev->lpac_enabled)
  1026. gen8_regwrite_aperture(device, GEN8_CP_APRIV_CNTL_PIPE,
  1027. GEN8_APRIV_DEFAULT, PIPE_LPAC, 0, 0);
  1028. if (ADRENO_FEATURE(adreno_dev, ADRENO_AQE)) {
  1029. gen8_regwrite_aperture(device, GEN8_CP_APRIV_CNTL_PIPE,
  1030. GEN8_APRIV_DEFAULT, PIPE_AQE0, 0, 0);
  1031. gen8_regwrite_aperture(device, GEN8_CP_APRIV_CNTL_PIPE,
  1032. GEN8_APRIV_DEFAULT, PIPE_AQE1, 0, 0);
  1033. }
  1034. /* Clear aperture register */
  1035. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  1036. _set_secvid(device);
  1037. /*
  1038. * Enable hardware clock gating here to prevent any register access
  1039. * issue due to internal clock gating.
  1040. */
  1041. gen8_hwcg_set(adreno_dev, true);
  1042. /*
  1043. * All registers must be written before this point so that we don't
  1044. * miss any register programming when we patch the power up register
  1045. * list.
  1046. */
  1047. if (!adreno_dev->patch_reglist &&
  1048. (adreno_dev->pwrup_reglist->gpuaddr != 0)) {
  1049. gen8_patch_pwrup_reglist(adreno_dev);
  1050. adreno_dev->patch_reglist = true;
  1051. }
  1052. return 0;
  1053. }
  1054. /* Offsets into the MX/CX mapped register regions */
  1055. #define GEN8_RDPM_MX_OFFSET 0xf00
  1056. #define GEN8_RDPM_CX_OFFSET 0xf14
  1057. void gen8_rdpm_mx_freq_update(struct gen8_gmu_device *gmu, u32 freq)
  1058. {
  1059. if (gmu->rdpm_mx_virt) {
  1060. writel_relaxed(freq/1000, (gmu->rdpm_mx_virt + GEN8_RDPM_MX_OFFSET));
  1061. /*
  1062. * ensure previous writes post before this one,
  1063. * i.e. act like normal writel()
  1064. */
  1065. wmb();
  1066. }
  1067. }
  1068. void gen8_rdpm_cx_freq_update(struct gen8_gmu_device *gmu, u32 freq)
  1069. {
  1070. if (gmu->rdpm_cx_virt) {
  1071. writel_relaxed(freq/1000, (gmu->rdpm_cx_virt + GEN8_RDPM_CX_OFFSET));
  1072. /*
  1073. * ensure previous writes post before this one,
  1074. * i.e. act like normal writel()
  1075. */
  1076. wmb();
  1077. }
  1078. }
  1079. int gen8_scm_gpu_init_cx_regs(struct adreno_device *adreno_dev)
  1080. {
  1081. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1082. u32 gpu_req = GPU_ALWAYS_EN_REQ;
  1083. int ret;
  1084. if (ADRENO_FEATURE(adreno_dev, ADRENO_BCL))
  1085. gpu_req |= GPU_BCL_EN_REQ;
  1086. if (ADRENO_FEATURE(adreno_dev, ADRENO_CLX))
  1087. gpu_req |= GPU_CLX_EN_REQ;
  1088. gpu_req |= GPU_TSENSE_EN_REQ;
  1089. ret = kgsl_scm_gpu_init_regs(&device->pdev->dev, gpu_req);
  1090. /*
  1091. * For targets that support this scm call to program BCL id , enable BCL.
  1092. * For other targets, BCL is enabled after first GMU boot.
  1093. */
  1094. if (!ret && ADRENO_FEATURE(adreno_dev, ADRENO_BCL))
  1095. adreno_dev->bcl_enabled = true;
  1096. /* If programming TZ CLX was successful, then program KMD owned CLX regs */
  1097. if (!ret && ADRENO_FEATURE(adreno_dev, ADRENO_CLX))
  1098. adreno_dev->clx_enabled = true;
  1099. /*
  1100. * If scm call returned EOPNOTSUPP, either we are on a kernel version
  1101. * lesser than 6.1 where scm call is not supported or we are sending an
  1102. * empty request. Ignore the error in such cases.
  1103. */
  1104. return (ret == -EOPNOTSUPP) ? 0 : ret;
  1105. }
  1106. void gen8_spin_idle_debug(struct adreno_device *adreno_dev,
  1107. const char *str)
  1108. {
  1109. struct kgsl_device *device = &adreno_dev->dev;
  1110. u32 rptr, wptr, status, intstatus, global_status;
  1111. dev_err(device->dev, str);
  1112. kgsl_regread(device, GEN8_CP_RB_RPTR_BR, &rptr);
  1113. kgsl_regread(device, GEN8_CP_RB_WPTR_GC, &wptr);
  1114. kgsl_regread(device, GEN8_RBBM_STATUS, &status);
  1115. kgsl_regread(device, GEN8_RBBM_INT_0_STATUS, &intstatus);
  1116. kgsl_regread(device, GEN8_CP_INTERRUPT_STATUS_GLOBAL, &global_status);
  1117. dev_err(device->dev,
  1118. "rb=%d pos=%X/%X rbbm_status=%8.8X int_0_status=%8.8X global_status=%8.8X\n",
  1119. adreno_dev->cur_rb ? adreno_dev->cur_rb->id : -1, rptr, wptr,
  1120. status, intstatus, global_status);
  1121. kgsl_device_snapshot(device, NULL, NULL, false);
  1122. }
  1123. /*
  1124. * gen8_send_cp_init() - Initialize ringbuffer
  1125. * @adreno_dev: Pointer to adreno device
  1126. * @rb: Pointer to the ringbuffer of device
  1127. *
  1128. * Submit commands for ME initialization,
  1129. */
  1130. static int gen8_send_cp_init(struct adreno_device *adreno_dev,
  1131. struct adreno_ringbuffer *rb)
  1132. {
  1133. u32 *cmds;
  1134. int ret;
  1135. cmds = adreno_ringbuffer_allocspace(rb, GEN8_CP_INIT_DWORDS);
  1136. if (IS_ERR(cmds))
  1137. return PTR_ERR(cmds);
  1138. gen8_cp_init_cmds(adreno_dev, cmds);
  1139. ret = gen8_ringbuffer_submit(rb, NULL);
  1140. if (ret)
  1141. return ret;
  1142. ret = adreno_spin_idle(adreno_dev, 2000);
  1143. if (ret) {
  1144. gen8_spin_idle_debug(adreno_dev,
  1145. "CP initialization failed to idle\n");
  1146. rb->wptr = 0;
  1147. rb->_wptr = 0;
  1148. }
  1149. return ret;
  1150. }
  1151. static int gen8_post_start(struct adreno_device *adreno_dev)
  1152. {
  1153. int ret;
  1154. u32 *cmds;
  1155. struct adreno_ringbuffer *rb = adreno_dev->cur_rb;
  1156. struct adreno_preemption *preempt = &adreno_dev->preempt;
  1157. u64 kmd_postamble_addr;
  1158. if (!adreno_is_preemption_enabled(adreno_dev))
  1159. return 0;
  1160. kmd_postamble_addr = SCRATCH_POSTAMBLE_ADDR(KGSL_DEVICE(adreno_dev));
  1161. gen8_preemption_prepare_postamble(adreno_dev);
  1162. cmds = adreno_ringbuffer_allocspace(rb,
  1163. (preempt->postamble_bootup_len ? 16 : 12));
  1164. if (IS_ERR(cmds))
  1165. return PTR_ERR(cmds);
  1166. *cmds++ = cp_type7_packet(CP_SET_PSEUDO_REGISTER, 6);
  1167. *cmds++ = SET_PSEUDO_PRIV_NON_SECURE_SAVE_ADDR;
  1168. *cmds++ = lower_32_bits(rb->preemption_desc->gpuaddr);
  1169. *cmds++ = upper_32_bits(rb->preemption_desc->gpuaddr);
  1170. *cmds++ = SET_PSEUDO_PRIV_SECURE_SAVE_ADDR;
  1171. *cmds++ = lower_32_bits(rb->secure_preemption_desc->gpuaddr);
  1172. *cmds++ = upper_32_bits(rb->secure_preemption_desc->gpuaddr);
  1173. if (preempt->postamble_bootup_len) {
  1174. *cmds++ = cp_type7_packet(CP_SET_AMBLE, 3);
  1175. *cmds++ = lower_32_bits(kmd_postamble_addr);
  1176. *cmds++ = upper_32_bits(kmd_postamble_addr);
  1177. *cmds++ = FIELD_PREP(GENMASK(22, 20), CP_KMD_AMBLE_TYPE)
  1178. | (FIELD_PREP(GENMASK(19, 0),
  1179. adreno_dev->preempt.postamble_bootup_len));
  1180. }
  1181. *cmds++ = cp_type7_packet(CP_CONTEXT_SWITCH_YIELD, 4);
  1182. *cmds++ = 0;
  1183. *cmds++ = 0;
  1184. *cmds++ = 0;
  1185. /* generate interrupt on preemption completion */
  1186. *cmds++ = 0;
  1187. ret = gen8_ringbuffer_submit(rb, NULL);
  1188. if (!ret) {
  1189. ret = adreno_spin_idle(adreno_dev, 2000);
  1190. if (ret)
  1191. gen8_spin_idle_debug(adreno_dev,
  1192. "hw preemption initialization failed to idle\n");
  1193. }
  1194. return ret;
  1195. }
  1196. int gen8_rb_start(struct adreno_device *adreno_dev)
  1197. {
  1198. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  1199. struct adreno_firmware *fw = ADRENO_FW(adreno_dev, ADRENO_FW_SQE);
  1200. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1201. struct adreno_ringbuffer *rb;
  1202. u64 addr;
  1203. int ret, i;
  1204. u32 *cmds;
  1205. /* Clear all the ringbuffers */
  1206. FOR_EACH_RINGBUFFER(adreno_dev, rb, i) {
  1207. memset(rb->buffer_desc->hostptr, 0xaa, KGSL_RB_SIZE);
  1208. kgsl_sharedmem_writel(device->scratch,
  1209. SCRATCH_RB_OFFSET(rb->id, rptr), 0);
  1210. kgsl_sharedmem_writel(device->scratch,
  1211. SCRATCH_RB_OFFSET(rb->id, bv_rptr), 0);
  1212. rb->wptr = 0;
  1213. rb->_wptr = 0;
  1214. rb->wptr_preempt_end = UINT_MAX;
  1215. }
  1216. gen8_preemption_start(adreno_dev);
  1217. /* Set up the current ringbuffer */
  1218. rb = ADRENO_CURRENT_RINGBUFFER(adreno_dev);
  1219. addr = SCRATCH_RB_GPU_ADDR(device, rb->id, rptr);
  1220. kgsl_regwrite(device, GEN8_CP_RB_RPTR_ADDR_LO_BR, lower_32_bits(addr));
  1221. kgsl_regwrite(device, GEN8_CP_RB_RPTR_ADDR_HI_BR, upper_32_bits(addr));
  1222. addr = SCRATCH_RB_GPU_ADDR(device, rb->id, bv_rptr);
  1223. kgsl_regwrite(device, GEN8_CP_RB_RPTR_ADDR_LO_BV, lower_32_bits(addr));
  1224. kgsl_regwrite(device, GEN8_CP_RB_RPTR_ADDR_HI_BV, upper_32_bits(addr));
  1225. kgsl_regwrite(device, GEN8_CP_RB_CNTL_GC, GEN8_CP_RB_CNTL_DEFAULT);
  1226. kgsl_regwrite(device, GEN8_CP_RB_BASE_LO_GC,
  1227. lower_32_bits(rb->buffer_desc->gpuaddr));
  1228. kgsl_regwrite(device, GEN8_CP_RB_BASE_HI_GC,
  1229. upper_32_bits(rb->buffer_desc->gpuaddr));
  1230. /* Program the ucode base for CP */
  1231. kgsl_regwrite(device, GEN8_CP_SQE_INSTR_BASE_LO,
  1232. lower_32_bits(fw->memdesc->gpuaddr));
  1233. kgsl_regwrite(device, GEN8_CP_SQE_INSTR_BASE_HI,
  1234. upper_32_bits(fw->memdesc->gpuaddr));
  1235. /* Clear the SQE_HALT to start the CP engine */
  1236. kgsl_regwrite(device, GEN8_CP_SQE_CNTL, 1);
  1237. ret = gen8_send_cp_init(adreno_dev, rb);
  1238. if (ret)
  1239. return ret;
  1240. ret = adreno_zap_shader_load(adreno_dev, gen8_core->zap_name);
  1241. if (ret)
  1242. return ret;
  1243. /*
  1244. * Take the GPU out of secure mode. Try the zap shader if it is loaded,
  1245. * otherwise just try to write directly to the secure control register
  1246. */
  1247. if (!adreno_dev->zap_loaded)
  1248. kgsl_regwrite(device, GEN8_RBBM_SECVID_TRUST_CNTL, 0);
  1249. else {
  1250. cmds = adreno_ringbuffer_allocspace(rb, 2);
  1251. if (IS_ERR(cmds))
  1252. return PTR_ERR(cmds);
  1253. *cmds++ = cp_type7_packet(CP_SET_SECURE_MODE, 1);
  1254. *cmds++ = 0;
  1255. ret = gen8_ringbuffer_submit(rb, NULL);
  1256. if (!ret) {
  1257. ret = adreno_spin_idle(adreno_dev, 2000);
  1258. if (ret) {
  1259. gen8_spin_idle_debug(adreno_dev,
  1260. "Switch to unsecure failed to idle\n");
  1261. return ret;
  1262. }
  1263. }
  1264. }
  1265. return gen8_post_start(adreno_dev);
  1266. }
  1267. /*
  1268. * gen8_gpu_keepalive() - GMU reg write to request GPU stays on
  1269. * @adreno_dev: Pointer to the adreno device that has the GMU
  1270. * @state: State to set: true is ON, false is OFF
  1271. */
  1272. static void gen8_gpu_keepalive(struct adreno_device *adreno_dev,
  1273. bool state)
  1274. {
  1275. gmu_core_regwrite(KGSL_DEVICE(adreno_dev),
  1276. GEN8_GMUCX_PWR_COL_KEEPALIVE, state);
  1277. }
  1278. bool gen8_hw_isidle(struct adreno_device *adreno_dev)
  1279. {
  1280. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1281. u32 reg;
  1282. gmu_core_regread(device, GEN8_GMUAO_GPU_CX_BUSY_STATUS, &reg);
  1283. /* Bit 23 is GPUBUSYIGNAHB */
  1284. return (reg & BIT(23)) ? false : true;
  1285. }
  1286. int gen8_microcode_read(struct adreno_device *adreno_dev)
  1287. {
  1288. struct adreno_firmware *sqe_fw = ADRENO_FW(adreno_dev, ADRENO_FW_SQE);
  1289. const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
  1290. return adreno_get_firmware(adreno_dev, gen8_core->sqefw_name, sqe_fw);
  1291. }
  1292. /* CP Interrupt bits */
  1293. #define GEN8_CP_GLOBAL_INT_HWFAULTBR 0
  1294. #define GEN8_CP_GLOBAL_INT_HWFAULTBV 1
  1295. #define GEN8_CP_GLOBAL_INT_HWFAULTLPAC 2
  1296. #define GEN8_CP_GLOBAL_INT_HWFAULTAQE0 3
  1297. #define GEN8_CP_GLOBAL_INT_HWFAULTAQE1 4
  1298. #define GEN8_CP_GLOBAL_INT_HWFAULTDDEBR 5
  1299. #define GEN8_CP_GLOBAL_INT_HWFAULTDDEBV 6
  1300. #define GEN8_CP_GLOBAL_INT_SWFAULTBR 16
  1301. #define GEN8_CP_GLOBAL_INT_SWFAULTBV 17
  1302. #define GEN8_CP_GLOBAL_INT_SWFAULTLPAC 18
  1303. #define GEN8_CP_GLOBAL_INT_SWFAULTAQE0 19
  1304. #define GEN8_CP_GLOBAL_INT_SWFAULTAQE1 20
  1305. #define GEN8_CP_GLOBAL_INT_SWFAULTDDEBR 21
  1306. #define GEN8_CP_GLOBAL_INT_SWFAULTDDEBV 22
  1307. /* CP HW Fault status bits */
  1308. #define CP_HW_RBFAULT 0
  1309. #define CP_HW_IB1FAULT 1
  1310. #define CP_HW_IB2FAULT 2
  1311. #define CP_HW_IB3FAULT 3
  1312. #define CP_HW_SDSFAULT 4
  1313. #define CP_HW_MRBFAULT 5
  1314. #define CP_HW_VSDFAULT 6
  1315. #define CP_HW_SQEREADBRUSTOVF 8
  1316. #define CP_HW_EVENTENGINEOVF 9
  1317. #define CP_HW_UCODEERROR 10
  1318. /* CP SW Fault status bits */
  1319. #define CP_SW_CSFRBWRAP 0
  1320. #define CP_SW_CSFIB1WRAP 1
  1321. #define CP_SW_CSFIB2WRAP 2
  1322. #define CP_SW_CSFIB3WRAP 3
  1323. #define CP_SW_SDSWRAP 4
  1324. #define CP_SW_MRBWRAP 5
  1325. #define CP_SW_VSDWRAP 6
  1326. #define CP_SW_OPCODEERROR 8
  1327. #define CP_SW_VSDPARITYERROR 9
  1328. #define CP_SW_REGISTERPROTECTIONERROR 10
  1329. #define CP_SW_ILLEGALINSTRUCTION 11
  1330. #define CP_SW_SMMUFAULT 12
  1331. #define CP_SW_VBIFRESPCLIENT 13
  1332. #define CP_SW_VBIFRESPTYPE 19
  1333. #define CP_SW_VBIFRESPREAD 21
  1334. #define CP_SW_VBIFRESP 22
  1335. #define CP_SW_RTWROVF 23
  1336. #define CP_SW_LRZRTWROVF 24
  1337. #define CP_SW_LRZRTREFCNTOVF 25
  1338. #define CP_SW_LRZRTCLRRESMISS 26
  1339. static void gen8_get_cp_hwfault_status(struct adreno_device *adreno_dev, u32 status)
  1340. {
  1341. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1342. u32 hw_status;
  1343. u32 pipe_id = PIPE_NONE;
  1344. const char * const table[] = {
  1345. [CP_HW_RBFAULT] = "RBFAULT",
  1346. [CP_HW_IB1FAULT] = "IB1FAULT",
  1347. [CP_HW_IB2FAULT] = "IB2FAULT",
  1348. [CP_HW_SDSFAULT] = "SDSFAULT",
  1349. [CP_HW_MRBFAULT] = "MRGFAULT",
  1350. [CP_HW_VSDFAULT] = "VSDFAULT",
  1351. [CP_HW_SQEREADBRUSTOVF] = "SQEREADBRUSTOVF",
  1352. [CP_HW_EVENTENGINEOVF] = "EVENTENGINEOVF",
  1353. [CP_HW_UCODEERROR] = "UCODEERROR",
  1354. };
  1355. switch (status) {
  1356. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTBR):
  1357. pipe_id = PIPE_BR;
  1358. break;
  1359. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTBV):
  1360. pipe_id = PIPE_BV;
  1361. break;
  1362. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTLPAC):
  1363. pipe_id = PIPE_LPAC;
  1364. break;
  1365. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTAQE0):
  1366. pipe_id = PIPE_AQE0;
  1367. break;
  1368. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTAQE1):
  1369. pipe_id = PIPE_AQE1;
  1370. break;
  1371. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTDDEBR):
  1372. pipe_id = PIPE_DDE_BR;
  1373. break;
  1374. case BIT(GEN8_CP_GLOBAL_INT_HWFAULTDDEBV):
  1375. pipe_id = PIPE_DDE_BV;
  1376. break;
  1377. }
  1378. gen8_regread_aperture(device, GEN8_CP_HW_FAULT_STATUS_PIPE, &hw_status,
  1379. pipe_id, 0, 0);
  1380. /* Clear aperture register */
  1381. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  1382. dev_crit_ratelimited(device->dev, "CP HW Fault pipe_id:%u %s\n", pipe_id,
  1383. hw_status < ARRAY_SIZE(table) ? table[hw_status] : "UNKNOWN");
  1384. }
  1385. static void gen8_get_cp_swfault_status(struct adreno_device *adreno_dev, u32 status)
  1386. {
  1387. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1388. u32 sw_status, status1;
  1389. u32 opcode, pipe_id = PIPE_NONE;
  1390. const char * const table[] = {
  1391. [CP_SW_CSFRBWRAP] = "CSFRBWRAP",
  1392. [CP_SW_CSFIB1WRAP] = "CSFIB1WRAP",
  1393. [CP_SW_CSFIB2WRAP] = "CSFIB2WRAP",
  1394. [CP_SW_CSFIB3WRAP] = "CSFIB3WRAP",
  1395. [CP_SW_SDSWRAP] = "SDSWRAP",
  1396. [CP_SW_MRBWRAP] = "MRBWRAP",
  1397. [CP_SW_VSDWRAP] = "VSDWRAP",
  1398. [CP_SW_OPCODEERROR] = "OPCODEERROR",
  1399. [CP_SW_VSDPARITYERROR] = "VSDPARITYERROR",
  1400. [CP_SW_REGISTERPROTECTIONERROR] = "REGISTERPROTECTIONERROR",
  1401. [CP_SW_ILLEGALINSTRUCTION] = "ILLEGALINSTRUCTION",
  1402. [CP_SW_SMMUFAULT] = "SMMUFAULT",
  1403. [CP_SW_VBIFRESPCLIENT] = "VBIFRESPCLIENT",
  1404. [CP_SW_VBIFRESPTYPE] = "VBIFRESPTYPE",
  1405. [CP_SW_VBIFRESPREAD] = "VBIFRESPREAD",
  1406. [CP_SW_VBIFRESP] = "VBIFRESP",
  1407. [CP_SW_RTWROVF] = "RTWROVF",
  1408. [CP_SW_LRZRTWROVF] = "LRZRTWROVF",
  1409. [CP_SW_LRZRTREFCNTOVF] = "LRZRTREFCNTOVF",
  1410. [CP_SW_LRZRTCLRRESMISS] = "LRZRTCLRRESMISS",
  1411. };
  1412. switch (status) {
  1413. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTBR):
  1414. pipe_id = PIPE_BR;
  1415. break;
  1416. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTBV):
  1417. pipe_id = PIPE_BV;
  1418. break;
  1419. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTLPAC):
  1420. pipe_id = PIPE_LPAC;
  1421. break;
  1422. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTAQE0):
  1423. pipe_id = PIPE_AQE0;
  1424. break;
  1425. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTAQE1):
  1426. pipe_id = PIPE_AQE1;
  1427. break;
  1428. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTDDEBR):
  1429. pipe_id = PIPE_DDE_BR;
  1430. break;
  1431. case BIT(GEN8_CP_GLOBAL_INT_SWFAULTDDEBV):
  1432. pipe_id = PIPE_DDE_BV;
  1433. break;
  1434. }
  1435. gen8_regread_aperture(device, GEN8_CP_INTERRUPT_STATUS_PIPE, &sw_status,
  1436. pipe_id, 0, 0);
  1437. dev_crit_ratelimited(device->dev, "CP SW Fault pipe_id: %u %s\n", pipe_id,
  1438. sw_status < ARRAY_SIZE(table) ? table[sw_status] : "UNKNOWN");
  1439. if (sw_status & BIT(CP_SW_OPCODEERROR)) {
  1440. gen8_regwrite_aperture(device, GEN8_CP_SQE_STAT_ADDR_PIPE, 1,
  1441. pipe_id, 0, 0);
  1442. gen8_regread_aperture(device, GEN8_CP_SQE_STAT_DATA_PIPE, &opcode,
  1443. pipe_id, 0, 0);
  1444. dev_crit_ratelimited(device->dev,
  1445. "CP opcode error interrupt | opcode=0x%8.8x\n", opcode);
  1446. }
  1447. if (sw_status & BIT(CP_SW_REGISTERPROTECTIONERROR)) {
  1448. gen8_regread_aperture(device, GEN8_CP_PROTECT_STATUS_PIPE, &status1,
  1449. pipe_id, 0, 0);
  1450. dev_crit_ratelimited(device->dev,
  1451. "CP | Protected mode error | %s | addr=%lx | status=%x\n",
  1452. FIELD_GET(GENMASK(20, 20), status1) ? "READ" : "WRITE",
  1453. FIELD_GET(GENMASK(17, 0), status1), status1);
  1454. }
  1455. /* Clear aperture register */
  1456. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  1457. }
  1458. static void gen8_cp_hw_err_callback(struct adreno_device *adreno_dev, int bit)
  1459. {
  1460. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1461. u32 global_status;
  1462. u32 hw_fault, sw_fault;
  1463. kgsl_regread(device, GEN8_CP_INTERRUPT_STATUS_GLOBAL, &global_status);
  1464. dev_crit_ratelimited(device->dev, "CP fault int_status_global=0x%x\n", global_status);
  1465. hw_fault = FIELD_GET(GENMASK(6, 0), global_status);
  1466. sw_fault = FIELD_GET(GENMASK(22, 16), global_status);
  1467. if (hw_fault)
  1468. gen8_get_cp_hwfault_status(adreno_dev, hw_fault);
  1469. else if (sw_fault)
  1470. gen8_get_cp_swfault_status(adreno_dev, sw_fault);
  1471. }
  1472. static void gen8_err_callback(struct adreno_device *adreno_dev, int bit)
  1473. {
  1474. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1475. switch (bit) {
  1476. case GEN8_INT_AHBERROR:
  1477. {
  1478. u32 err_details_0, err_details_1;
  1479. kgsl_regread(device, GEN8_CP_RL_ERROR_DETAILS_0, &err_details_0);
  1480. kgsl_regread(device, GEN8_CP_RL_ERROR_DETAILS_1, &err_details_1);
  1481. dev_crit_ratelimited(device->dev,
  1482. "CP: AHB bus error, CP_RL_ERROR_DETAILS_0:0x%x CP_RL_ERROR_DETAILS_1:0x%x\n",
  1483. err_details_0, err_details_1);
  1484. break;
  1485. }
  1486. case GEN8_INT_ATBASYNCFIFOOVERFLOW:
  1487. dev_crit_ratelimited(device->dev, "RBBM: ATB ASYNC overflow\n");
  1488. break;
  1489. case GEN8_INT_ATBBUSOVERFLOW:
  1490. dev_crit_ratelimited(device->dev, "RBBM: ATB bus overflow\n");
  1491. break;
  1492. case GEN8_INT_OUTOFBOUNDACCESS:
  1493. dev_crit_ratelimited(device->dev, "UCHE: Out of bounds access\n");
  1494. break;
  1495. case GEN8_INT_UCHETRAPINTERRUPT:
  1496. dev_crit_ratelimited(device->dev, "UCHE: Trap interrupt\n");
  1497. break;
  1498. case GEN8_INT_TSBWRITEERROR:
  1499. {
  1500. u32 lo, hi;
  1501. kgsl_regread(device, GEN8_RBBM_SECVID_TSB_STATUS_LO, &lo);
  1502. kgsl_regread(device, GEN8_RBBM_SECVID_TSB_STATUS_HI, &hi);
  1503. dev_crit_ratelimited(device->dev, "TSB: Write error interrupt: Address: 0x%lx MID: %lu\n",
  1504. FIELD_GET(GENMASK(16, 0), hi) << 32 | lo,
  1505. FIELD_GET(GENMASK(31, 23), hi));
  1506. break;
  1507. }
  1508. default:
  1509. dev_crit_ratelimited(device->dev, "Unknown interrupt %d\n", bit);
  1510. }
  1511. }
  1512. static const char *const uche_client[] = {
  1513. "BR_VFD", "BR_SP", "BR_VSC", "BR_VPC",
  1514. "BR_HLSQ", "BR_PC", "BR_LRZ", "BR_TP",
  1515. "BV_VFD", "BV_SP", "BV_VSC", "BV_VPC",
  1516. "BV_HLSQ", "BV_PC", "BV_LRZ", "BV_TP",
  1517. "STCHE",
  1518. };
  1519. static const char *const uche_lpac_client[] = {
  1520. "-", "SP_LPAC", "-", "-", "HLSQ_LPAC", "-", "-", "TP_LPAC"
  1521. };
  1522. #define SCOOBYDOO 0x5c00bd00
  1523. static const char *gen8_fault_block_uche(struct kgsl_device *device,
  1524. char *str, int size, bool lpac)
  1525. {
  1526. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  1527. u32 uche_client_id = adreno_dev->uche_client_pf;
  1528. const char *uche_client_str, *fault_block;
  1529. /*
  1530. * Smmu driver takes a vote on CX gdsc before calling the kgsl
  1531. * pagefault handler. If there is contention for device mutex in this
  1532. * path and the dispatcher fault handler is holding this lock, trying
  1533. * to turn off CX gdsc will fail during the reset. So to avoid blocking
  1534. * here, try to lock device mutex and return if it fails.
  1535. */
  1536. if (!mutex_trylock(&device->mutex))
  1537. goto regread_fail;
  1538. if (!kgsl_state_is_awake(device)) {
  1539. mutex_unlock(&device->mutex);
  1540. goto regread_fail;
  1541. }
  1542. kgsl_regread(device, GEN8_UCHE_CLIENT_PF, &uche_client_id);
  1543. mutex_unlock(&device->mutex);
  1544. /* Ignore the value if the gpu is in IFPC */
  1545. if (uche_client_id == SCOOBYDOO) {
  1546. uche_client_id = adreno_dev->uche_client_pf;
  1547. goto regread_fail;
  1548. }
  1549. /* UCHE client id mask is bits [6:0] */
  1550. uche_client_id &= GENMASK(6, 0);
  1551. regread_fail:
  1552. if (lpac) {
  1553. fault_block = "UCHE_LPAC";
  1554. if (uche_client_id >= ARRAY_SIZE(uche_lpac_client))
  1555. goto fail;
  1556. uche_client_str = uche_lpac_client[uche_client_id];
  1557. } else {
  1558. fault_block = "UCHE";
  1559. if (uche_client_id >= ARRAY_SIZE(uche_client))
  1560. goto fail;
  1561. uche_client_str = uche_client[uche_client_id];
  1562. }
  1563. snprintf(str, size, "%s: %s", fault_block, uche_client_str);
  1564. return str;
  1565. fail:
  1566. snprintf(str, size, "%s: Unknown (client_id: %u)",
  1567. fault_block, uche_client_id);
  1568. return str;
  1569. }
  1570. static const char *gen8_iommu_fault_block(struct kgsl_device *device,
  1571. u32 fsynr1)
  1572. {
  1573. u32 mid = fsynr1 & 0xff;
  1574. static char str[36];
  1575. switch (mid) {
  1576. case 0x0:
  1577. return "CP";
  1578. case 0x1:
  1579. return "UCHE: Unknown";
  1580. case 0x2:
  1581. return "UCHE_LPAC: Unknown";
  1582. case 0x3:
  1583. return gen8_fault_block_uche(device, str, sizeof(str), false);
  1584. case 0x4:
  1585. return "CCU";
  1586. case 0x5:
  1587. return "Flag cache";
  1588. case 0x6:
  1589. return "PREFETCH";
  1590. case 0x7:
  1591. return "GMU";
  1592. case 0x8:
  1593. return gen8_fault_block_uche(device, str, sizeof(str), true);
  1594. case 0x9:
  1595. return "UCHE_HPAC";
  1596. }
  1597. snprintf(str, sizeof(str), "Unknown (mid: %u)", mid);
  1598. return str;
  1599. }
  1600. static void gen8_cp_callback(struct adreno_device *adreno_dev, int bit)
  1601. {
  1602. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1603. if (adreno_is_preemption_enabled(adreno_dev))
  1604. gen8_preemption_trigger(adreno_dev, true);
  1605. adreno_dispatcher_schedule(device);
  1606. }
  1607. /*
  1608. * gen8_gpc_err_int_callback() - Isr for GPC error interrupts
  1609. * @adreno_dev: Pointer to device
  1610. * @bit: Interrupt bit
  1611. */
  1612. static void gen8_gpc_err_int_callback(struct adreno_device *adreno_dev, int bit)
  1613. {
  1614. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1615. /*
  1616. * GPC error is typically the result of mistake SW programming.
  1617. * Force GPU fault for this interrupt so that we can debug it
  1618. * with help of register dump.
  1619. */
  1620. dev_crit(device->dev, "RBBM: GPC error\n");
  1621. adreno_irqctrl(adreno_dev, 0);
  1622. /* Trigger a fault in the dispatcher - this will effect a restart */
  1623. adreno_dispatcher_fault(adreno_dev, ADRENO_SOFT_FAULT);
  1624. }
  1625. /*
  1626. * gen8_swfuse_violation_callback() - ISR for software fuse violation interrupt
  1627. * @adreno_dev: Pointer to device
  1628. * @bit: Interrupt bit
  1629. */
  1630. static void gen8_swfuse_violation_callback(struct adreno_device *adreno_dev, int bit)
  1631. {
  1632. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1633. u32 status;
  1634. /*
  1635. * SWFUSEVIOLATION error is typically the result of enabling software
  1636. * feature which is not supported by the hardware. Following are the
  1637. * Feature violation will be reported
  1638. * 1) FASTBLEND (BIT:0): NO Fault, RB will send the workload to legacy
  1639. * blender HW pipeline.
  1640. * 2) LPAC (BIT:1): Fault
  1641. * 3) RAYTRACING (BIT:2): Fault
  1642. */
  1643. kgsl_regread(device, GEN8_RBBM_SW_FUSE_INT_STATUS, &status);
  1644. /*
  1645. * RBBM_INT_CLEAR_CMD will not clear SWFUSEVIOLATION interrupt. Hence
  1646. * do explicit swfuse irq clear.
  1647. */
  1648. kgsl_regwrite(device, GEN8_RBBM_SW_FUSE_INT_MASK, 0);
  1649. dev_crit_ratelimited(device->dev,
  1650. "RBBM: SW Feature Fuse violation status=0x%8.8x\n", status);
  1651. /* Trigger a fault in the dispatcher for LPAC and RAYTRACING violation */
  1652. if (status & GENMASK(GEN8_RAYTRACING_SW_FUSE, GEN8_LPAC_SW_FUSE)) {
  1653. adreno_irqctrl(adreno_dev, 0);
  1654. adreno_dispatcher_fault(adreno_dev, ADRENO_HARD_FAULT);
  1655. }
  1656. }
  1657. static const struct adreno_irq_funcs gen8_irq_funcs[32] = {
  1658. ADRENO_IRQ_CALLBACK(NULL), /* 0 - RBBM_GPU_IDLE */
  1659. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 1 - RBBM_AHB_ERROR */
  1660. ADRENO_IRQ_CALLBACK(NULL), /* 2 - UNUSED */
  1661. ADRENO_IRQ_CALLBACK(NULL), /* 3 - UNUSED */
  1662. ADRENO_IRQ_CALLBACK(NULL), /* 4 - CPIPCINT0 */
  1663. ADRENO_IRQ_CALLBACK(NULL), /* 5 - CPIPCINT1 */
  1664. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 6 - ATBASYNCOVERFLOW */
  1665. ADRENO_IRQ_CALLBACK(gen8_gpc_err_int_callback), /* 7 - GPC_ERR */
  1666. ADRENO_IRQ_CALLBACK(gen8_preemption_callback),/* 8 - CP_SW */
  1667. ADRENO_IRQ_CALLBACK(gen8_cp_hw_err_callback), /* 9 - CP_HW_ERROR */
  1668. ADRENO_IRQ_CALLBACK(NULL), /* 10 - CP_CCU_FLUSH_DEPTH_TS */
  1669. ADRENO_IRQ_CALLBACK(NULL), /* 11 - CP_CCU_FLUSH_COLOR_TS */
  1670. ADRENO_IRQ_CALLBACK(NULL), /* 12 - CP_CCU_RESOLVE_TS */
  1671. ADRENO_IRQ_CALLBACK(NULL), /* 13 - UNUSED */
  1672. ADRENO_IRQ_CALLBACK(NULL), /* 14 - UNUSED */
  1673. ADRENO_IRQ_CALLBACK(adreno_cp_callback), /* 15 - CP_RB_INT */
  1674. ADRENO_IRQ_CALLBACK(NULL), /* 16 - CP_RB_INT_LPAC*/
  1675. ADRENO_IRQ_CALLBACK(NULL), /* 17 - CP_RB_DONE_TS */
  1676. ADRENO_IRQ_CALLBACK(NULL), /* 18 - UNUSED */
  1677. ADRENO_IRQ_CALLBACK(NULL), /* 19 - UNUSED */
  1678. ADRENO_IRQ_CALLBACK(gen8_cp_callback), /* 20 - CP_CACHE_FLUSH_TS */
  1679. ADRENO_IRQ_CALLBACK(NULL), /* 21 - CP_CACHE_TS_LPAC */
  1680. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 22 - RBBM_ATB_BUS_OVERFLOW */
  1681. ADRENO_IRQ_CALLBACK(adreno_hang_int_callback), /* 23 - MISHANGDETECT */
  1682. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 24 - UCHE_OOB_ACCESS */
  1683. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 25 - UCHE_TRAP_INTR */
  1684. ADRENO_IRQ_CALLBACK(NULL), /* 26 - DEBBUS_INTR_0 */
  1685. ADRENO_IRQ_CALLBACK(NULL), /* 27 - DEBBUS_INTR_1 */
  1686. ADRENO_IRQ_CALLBACK(gen8_err_callback), /* 28 - TSBWRITEERROR */
  1687. ADRENO_IRQ_CALLBACK(gen8_swfuse_violation_callback), /* 29 - SWFUSEVIOLATION */
  1688. ADRENO_IRQ_CALLBACK(NULL), /* 30 - ISDB_CPU_IRQ */
  1689. ADRENO_IRQ_CALLBACK(NULL), /* 31 - ISDB_UNDER_DEBUG */
  1690. };
  1691. /*
  1692. * If the AHB fence is not in ALLOW mode when we receive an RBBM
  1693. * interrupt, something went wrong. This means that we cannot proceed
  1694. * since the IRQ status and clear registers are not accessible.
  1695. * This is usually harmless because the GMU will abort power collapse
  1696. * and change the fence back to ALLOW. Poll so that this can happen.
  1697. */
  1698. static int gen8_irq_poll_fence(struct adreno_device *adreno_dev)
  1699. {
  1700. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1701. const struct adreno_gpudev *gpudev = ADRENO_GPU_DEVICE(adreno_dev);
  1702. u32 status, fence, fence_retries = 0;
  1703. u64 a, b, c;
  1704. a = gpudev->read_alwayson(adreno_dev);
  1705. kgsl_regread(device, GEN8_GMUAO_AHB_FENCE_CTRL, &fence);
  1706. while (fence != 0) {
  1707. b = gpudev->read_alwayson(adreno_dev);
  1708. /* Wait for small time before trying again */
  1709. udelay(1);
  1710. kgsl_regread(device, GEN8_GMUAO_AHB_FENCE_CTRL, &fence);
  1711. if (fence_retries == 100 && fence != 0) {
  1712. c = gpudev->read_alwayson(adreno_dev);
  1713. kgsl_regread(device, GEN8_GMUAO_RBBM_INT_UNMASKED_STATUS_SHADOW,
  1714. &status);
  1715. dev_crit_ratelimited(device->dev,
  1716. "status=0x%x Unmasked status=0x%x Mask=0x%x timestamps: %llx %llx %llx\n",
  1717. status & adreno_dev->irq_mask, status,
  1718. adreno_dev->irq_mask, a, b, c);
  1719. return -ETIMEDOUT;
  1720. }
  1721. fence_retries++;
  1722. }
  1723. return 0;
  1724. }
  1725. static irqreturn_t gen8_irq_handler(struct adreno_device *adreno_dev)
  1726. {
  1727. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1728. irqreturn_t ret = IRQ_NONE;
  1729. u32 status;
  1730. /*
  1731. * GPU can power down once the INT_0_STATUS is read below.
  1732. * But there still might be some register reads required so
  1733. * force the GMU/GPU into KEEPALIVE mode until done with the ISR.
  1734. */
  1735. gen8_gpu_keepalive(adreno_dev, true);
  1736. if (gen8_irq_poll_fence(adreno_dev)) {
  1737. adreno_dispatcher_fault(adreno_dev, ADRENO_GMU_FAULT);
  1738. goto done;
  1739. }
  1740. kgsl_regread(device, GEN8_RBBM_INT_0_STATUS, &status);
  1741. kgsl_regwrite(device, GEN8_RBBM_INT_CLEAR_CMD, status);
  1742. ret = adreno_irq_callbacks(adreno_dev, gen8_irq_funcs, status);
  1743. trace_kgsl_gen8_irq_status(adreno_dev, status);
  1744. done:
  1745. /* If hard fault, then let snapshot turn off the keepalive */
  1746. if (!(adreno_gpu_fault(adreno_dev) & ADRENO_HARD_FAULT))
  1747. gen8_gpu_keepalive(adreno_dev, false);
  1748. return ret;
  1749. }
  1750. static irqreturn_t gen8_cx_host_irq_handler(int irq, void *data)
  1751. {
  1752. struct kgsl_device *device = data;
  1753. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  1754. u32 status;
  1755. adreno_cx_misc_regread(adreno_dev, GEN8_GPU_CX_MISC_INT_0_STATUS, &status);
  1756. adreno_cx_misc_regwrite(adreno_dev, GEN8_GPU_CX_MISC_INT_CLEAR_CMD, status);
  1757. if (status & BIT(GEN8_CX_MISC_GPU_CC_IRQ))
  1758. KGSL_PWRCTRL_LOG_FREQLIM(device);
  1759. if (status & ~GEN8_CX_MISC_INT_MASK)
  1760. dev_err_ratelimited(device->dev, "Unhandled CX MISC interrupts 0x%lx\n",
  1761. status & ~GEN8_CX_MISC_INT_MASK);
  1762. return IRQ_HANDLED;
  1763. }
  1764. int gen8_probe_common(struct platform_device *pdev,
  1765. struct adreno_device *adreno_dev, u32 chipid,
  1766. const struct adreno_gpu_core *gpucore)
  1767. {
  1768. const struct adreno_gpudev *gpudev = gpucore->gpudev;
  1769. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1770. const struct adreno_gen8_core *gen8_core = container_of(gpucore,
  1771. struct adreno_gen8_core, base);
  1772. int ret;
  1773. adreno_dev->gpucore = gpucore;
  1774. adreno_dev->chipid = chipid;
  1775. adreno_reg_offset_init(gpudev->reg_offsets);
  1776. adreno_dev->hwcg_enabled = true;
  1777. adreno_dev->uche_client_pf = 1;
  1778. kgsl_pwrscale_fast_bus_hint(gen8_core->fast_bus_hint);
  1779. device->pwrctrl.cx_cfg_gdsc_offset = GEN8_GPU_CC_CX_CFG_GDSCR;
  1780. device->pwrctrl.rt_bus_hint = gen8_core->rt_bus_hint;
  1781. device->cx_host_irq_num = kgsl_request_irq_optional(pdev,
  1782. "cx_host_irq", gen8_cx_host_irq_handler, device);
  1783. ret = adreno_device_probe(pdev, adreno_dev);
  1784. if (ret)
  1785. return ret;
  1786. if (adreno_preemption_feature_set(adreno_dev)) {
  1787. adreno_dev->preempt.preempt_level = gen8_core->preempt_level;
  1788. adreno_dev->preempt.skipsaverestore = true;
  1789. adreno_dev->preempt.usesgmem = true;
  1790. set_bit(ADRENO_DEVICE_PREEMPTION, &adreno_dev->priv);
  1791. }
  1792. /* debugfs node for ACD calibration */
  1793. debugfs_create_file("acd_calibrate", 0644, device->d_debugfs, device, &acd_cal_fops);
  1794. /* Dump additional AQE 16KB data on top of default 128KB(64(BR)+64(BV)) */
  1795. device->snapshot_ctxt_record_size = ADRENO_FEATURE(adreno_dev, ADRENO_AQE) ?
  1796. (GEN8_SNAPSHOT_CTXRECORD_SIZE_IN_BYTES + SZ_16K) :
  1797. GEN8_SNAPSHOT_CTXRECORD_SIZE_IN_BYTES;
  1798. return 0;
  1799. }
  1800. /* Register offset defines for Gen8, in order of enum adreno_regs */
  1801. static u32 gen8_register_offsets[ADRENO_REG_REGISTER_MAX] = {
  1802. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_BASE, GEN8_CP_RB_BASE_LO_GC),
  1803. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_BASE_HI, GEN8_CP_RB_BASE_HI_GC),
  1804. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_RPTR, GEN8_CP_RB_RPTR_BR),
  1805. ADRENO_REG_DEFINE(ADRENO_REG_CP_RB_WPTR, GEN8_CP_RB_WPTR_GC),
  1806. ADRENO_REG_DEFINE(ADRENO_REG_CP_ME_CNTL, GEN8_CP_SQE_CNTL),
  1807. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BASE, GEN8_CP_IB1_BASE_LO_PIPE),
  1808. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BASE_HI, GEN8_CP_IB1_BASE_HI_PIPE),
  1809. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB1_BUFSZ, GEN8_CP_IB1_REM_SIZE_PIPE),
  1810. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BASE, GEN8_CP_IB2_BASE_LO_PIPE),
  1811. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BASE_HI, GEN8_CP_IB2_BASE_HI_PIPE),
  1812. ADRENO_REG_DEFINE(ADRENO_REG_CP_IB2_BUFSZ, GEN8_CP_IB2_REM_SIZE_PIPE),
  1813. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_STATUS, GEN8_RBBM_STATUS),
  1814. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_INT_0_MASK, GEN8_RBBM_INT_0_MASK),
  1815. ADRENO_REG_DEFINE(ADRENO_REG_RBBM_SW_RESET_CMD, GEN8_RBBM_SW_RESET_CMD),
  1816. ADRENO_REG_DEFINE(ADRENO_REG_GMU_AO_HOST_INTERRUPT_MASK,
  1817. GEN8_GMUAO_AO_HOST_INTERRUPT_MASK),
  1818. ADRENO_REG_DEFINE(ADRENO_REG_GMU_GMU2HOST_INTR_MASK,
  1819. GEN8_GMUCX_GMU2HOST_INTR_MASK),
  1820. };
  1821. static u32 _get_pipeid(u32 groupid)
  1822. {
  1823. switch (groupid) {
  1824. case KGSL_PERFCOUNTER_GROUP_BV_PC:
  1825. fallthrough;
  1826. case KGSL_PERFCOUNTER_GROUP_BV_VFD:
  1827. fallthrough;
  1828. case KGSL_PERFCOUNTER_GROUP_BV_VPC:
  1829. fallthrough;
  1830. case KGSL_PERFCOUNTER_GROUP_BV_TSE:
  1831. fallthrough;
  1832. case KGSL_PERFCOUNTER_GROUP_BV_RAS:
  1833. fallthrough;
  1834. case KGSL_PERFCOUNTER_GROUP_BV_LRZ:
  1835. fallthrough;
  1836. case KGSL_PERFCOUNTER_GROUP_BV_HLSQ:
  1837. return PIPE_BV;
  1838. case KGSL_PERFCOUNTER_GROUP_PC:
  1839. fallthrough;
  1840. case KGSL_PERFCOUNTER_GROUP_VFD:
  1841. fallthrough;
  1842. case KGSL_PERFCOUNTER_GROUP_HLSQ:
  1843. fallthrough;
  1844. case KGSL_PERFCOUNTER_GROUP_VPC:
  1845. fallthrough;
  1846. case KGSL_PERFCOUNTER_GROUP_CCU:
  1847. fallthrough;
  1848. case KGSL_PERFCOUNTER_GROUP_CMP:
  1849. fallthrough;
  1850. case KGSL_PERFCOUNTER_GROUP_TSE:
  1851. fallthrough;
  1852. case KGSL_PERFCOUNTER_GROUP_RAS:
  1853. fallthrough;
  1854. case KGSL_PERFCOUNTER_GROUP_LRZ:
  1855. fallthrough;
  1856. case KGSL_PERFCOUNTER_GROUP_RB:
  1857. return PIPE_BR;
  1858. default:
  1859. return PIPE_NONE;
  1860. }
  1861. }
  1862. int gen8_perfcounter_remove(struct adreno_device *adreno_dev,
  1863. struct adreno_perfcount_register *reg, u32 groupid)
  1864. {
  1865. const struct adreno_perfcounters *counters = ADRENO_PERFCOUNTERS(adreno_dev);
  1866. struct gen8_device *gen8_dev = container_of(adreno_dev, struct gen8_device, adreno_dev);
  1867. const struct adreno_perfcount_group *group;
  1868. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  1869. struct cpu_gpu_lock *lock = ptr;
  1870. u32 offset = ((lock->ifpc_list_len + lock->preemption_list_len) * 2) +
  1871. (gen8_dev->ext_pwrup_list_len * 3);
  1872. int i, last_offset, num_removed, start_offset = -1;
  1873. u32 *data = ptr + sizeof(*lock), pipe = FIELD_PREP(GENMASK(13, 12), _get_pipeid(groupid));
  1874. u16 perfcntr_list_len = lock->dynamic_list_len - gen8_dev->ext_pwrup_list_len;
  1875. if (!perfcntr_list_len)
  1876. return -EINVAL;
  1877. group = &(counters->groups[groupid]);
  1878. if (!(group->flags & ADRENO_PERFCOUNTER_GROUP_RESTORE)) {
  1879. if (perfcntr_list_len != 2)
  1880. return 0;
  1881. if (kgsl_hwlock(lock)) {
  1882. kgsl_hwunlock(lock);
  1883. return -EBUSY;
  1884. }
  1885. goto disable_perfcounter;
  1886. }
  1887. last_offset = offset + (perfcntr_list_len * 3);
  1888. /* Look for the perfcounter to remove in the list */
  1889. for (i = 0; i < perfcntr_list_len - 2; i++) {
  1890. if ((data[offset + 1] == reg->select) && (data[offset] == pipe)) {
  1891. start_offset = offset;
  1892. break;
  1893. }
  1894. offset += 3;
  1895. }
  1896. if (start_offset == -1)
  1897. return -ENOENT;
  1898. for (i = 0; i < PERFCOUNTER_REG_DEPENDENCY_LEN && reg->reg_dependency[i]; i++)
  1899. offset += 3;
  1900. if (kgsl_hwlock(lock)) {
  1901. kgsl_hwunlock(lock);
  1902. return -EBUSY;
  1903. }
  1904. /* Let offset point to the first entry that is going to be retained */
  1905. offset += 3;
  1906. memcpy(&data[start_offset], &data[offset], (last_offset - offset) * sizeof(u32));
  1907. memset(&data[start_offset + (last_offset - offset)], 0,
  1908. (offset - start_offset) * sizeof(u32));
  1909. num_removed = offset - start_offset;
  1910. do_div(num_removed, 3);
  1911. lock->dynamic_list_len -= num_removed;
  1912. disable_perfcounter:
  1913. /*
  1914. * If dynamic list length is 2 and no_restore_count is 0, then we can remove
  1915. * the perfcounter controls from the list.
  1916. */
  1917. if (perfcntr_list_len == 2 && !adreno_dev->no_restore_count) {
  1918. memset(&data[offset], 0, 6 * sizeof(u32));
  1919. lock->dynamic_list_len = gen8_dev->ext_pwrup_list_len;
  1920. }
  1921. kgsl_hwunlock(lock);
  1922. return 0;
  1923. }
  1924. int gen8_perfcounter_update(struct adreno_device *adreno_dev,
  1925. struct adreno_perfcount_register *reg, bool update_reg, u32 pipe, unsigned long flags)
  1926. {
  1927. struct gen8_device *gen8_dev = container_of(adreno_dev, struct gen8_device, adreno_dev);
  1928. void *ptr = adreno_dev->pwrup_reglist->hostptr;
  1929. struct cpu_gpu_lock *lock = ptr;
  1930. u32 offset = ((lock->ifpc_list_len + lock->preemption_list_len) * 2) +
  1931. (gen8_dev->ext_pwrup_list_len * 3);
  1932. u32 *data = ptr + sizeof(*lock);
  1933. int i, start_offset = -1;
  1934. u16 perfcntr_list_len = lock->dynamic_list_len - gen8_dev->ext_pwrup_list_len;
  1935. if (flags & ADRENO_PERFCOUNTER_GROUP_RESTORE) {
  1936. for (i = 0; i < perfcntr_list_len - 2; i++) {
  1937. if ((data[offset + 1] == reg->select) && (data[offset] == pipe)) {
  1938. start_offset = offset;
  1939. break;
  1940. }
  1941. offset += 3;
  1942. }
  1943. } else if (perfcntr_list_len) {
  1944. goto update;
  1945. }
  1946. if (kgsl_hwlock(lock)) {
  1947. kgsl_hwunlock(lock);
  1948. return -EBUSY;
  1949. }
  1950. /*
  1951. * If the perfcounter select register is already present in reglist
  1952. * update it, otherwise append the <aperture, select register, value>
  1953. * triplet to the end of the list.
  1954. */
  1955. if (start_offset != -1) {
  1956. data[offset + 2] = reg->countable;
  1957. for (i = 0; i < PERFCOUNTER_REG_DEPENDENCY_LEN && reg->reg_dependency[i]; i++) {
  1958. offset += 3;
  1959. data[offset + 2] = reg->countable;
  1960. }
  1961. kgsl_hwunlock(lock);
  1962. goto update;
  1963. }
  1964. /* Initialize the lock->dynamic_list_len to account for perfcounter controls */
  1965. if (!perfcntr_list_len)
  1966. lock->dynamic_list_len = gen8_dev->ext_pwrup_list_len + 2;
  1967. /*
  1968. * For all targets GEN8_SLICE_RBBM_PERFCTR_CNTL needs to be the last entry,
  1969. * so overwrite the existing GEN8_SLICE_RBBM_PERFCNTL_CNTL and add it back to
  1970. * the end.
  1971. */
  1972. if (flags & ADRENO_PERFCOUNTER_GROUP_RESTORE) {
  1973. data[offset++] = pipe;
  1974. data[offset++] = reg->select;
  1975. data[offset++] = reg->countable;
  1976. lock->dynamic_list_len++;
  1977. for (i = 0; i < PERFCOUNTER_REG_DEPENDENCY_LEN && reg->reg_dependency[i]; i++) {
  1978. data[offset++] = pipe;
  1979. data[offset++] = reg->reg_dependency[i];
  1980. data[offset++] = reg->countable;
  1981. lock->dynamic_list_len++;
  1982. }
  1983. }
  1984. data[offset++] = FIELD_PREP(GENMASK(15, 12), PIPE_NONE);
  1985. data[offset++] = GEN8_RBBM_PERFCTR_CNTL;
  1986. data[offset++] = 1;
  1987. data[offset++] = FIELD_PREP(GENMASK(15, 12), PIPE_NONE);
  1988. data[offset++] = GEN8_RBBM_SLICE_PERFCTR_CNTL;
  1989. data[offset++] = 1;
  1990. kgsl_hwunlock(lock);
  1991. update:
  1992. if (update_reg) {
  1993. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  1994. kgsl_regwrite(device, reg->select, reg->countable);
  1995. for (i = 0; i < PERFCOUNTER_REG_DEPENDENCY_LEN && reg->reg_dependency[i]; i++)
  1996. kgsl_regwrite(device, reg->reg_dependency[i], reg->countable);
  1997. }
  1998. return 0;
  1999. }
  2000. static u64 gen8_read_alwayson(struct adreno_device *adreno_dev)
  2001. {
  2002. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  2003. u32 lo = 0, hi = 0, tmp = 0;
  2004. /* Always use the GMU AO counter when doing a AHB read */
  2005. gmu_core_regread(device, GEN8_GMUCX_AO_COUNTER_HI, &hi);
  2006. gmu_core_regread(device, GEN8_GMUCX_AO_COUNTER_LO, &lo);
  2007. /* Check for overflow */
  2008. gmu_core_regread(device, GEN8_GMUCX_AO_COUNTER_HI, &tmp);
  2009. if (hi != tmp) {
  2010. gmu_core_regread(device, GEN8_GMUCX_AO_COUNTER_LO,
  2011. &lo);
  2012. hi = tmp;
  2013. }
  2014. return (((u64) hi) << 32) | lo;
  2015. }
  2016. static int gen8_lpac_store(struct adreno_device *adreno_dev, bool enable)
  2017. {
  2018. if (!ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
  2019. return -EINVAL;
  2020. if (!(adreno_dev->feature_fuse & BIT(GEN8_LPAC_SW_FUSE)) ||
  2021. (adreno_dev->lpac_enabled == enable))
  2022. return 0;
  2023. /* Power down the GPU before changing the lpac setting */
  2024. return adreno_power_cycle_bool(adreno_dev, &adreno_dev->lpac_enabled, enable);
  2025. }
  2026. static void gen8_remove(struct adreno_device *adreno_dev)
  2027. {
  2028. if (adreno_preemption_feature_set(adreno_dev))
  2029. del_timer(&adreno_dev->preempt.timer);
  2030. }
  2031. static void gen8_read_bus_stats(struct kgsl_device *device,
  2032. struct kgsl_power_stats *stats,
  2033. struct adreno_busy_data *busy)
  2034. {
  2035. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  2036. u64 ram_cycles, starved_ram;
  2037. ram_cycles = counter_delta(device, adreno_dev->ram_cycles_lo,
  2038. &busy->bif_ram_cycles);
  2039. starved_ram = counter_delta(device, adreno_dev->starved_ram_lo,
  2040. &busy->bif_starved_ram);
  2041. ram_cycles += counter_delta(device,
  2042. adreno_dev->ram_cycles_lo_ch1_read,
  2043. &busy->bif_ram_cycles_read_ch1);
  2044. ram_cycles += counter_delta(device,
  2045. adreno_dev->ram_cycles_lo_ch0_write,
  2046. &busy->bif_ram_cycles_write_ch0);
  2047. ram_cycles += counter_delta(device,
  2048. adreno_dev->ram_cycles_lo_ch1_write,
  2049. &busy->bif_ram_cycles_write_ch1);
  2050. starved_ram += counter_delta(device,
  2051. adreno_dev->starved_ram_lo_ch1,
  2052. &busy->bif_starved_ram_ch1);
  2053. stats->ram_time = ram_cycles;
  2054. stats->ram_wait = starved_ram;
  2055. }
  2056. static void gen8_power_stats(struct adreno_device *adreno_dev,
  2057. struct kgsl_power_stats *stats)
  2058. {
  2059. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  2060. struct adreno_busy_data *busy = &adreno_dev->busy_data;
  2061. u64 gpu_busy;
  2062. /* Set the GPU busy counter for frequency scaling */
  2063. gpu_busy = counter_delta(device, GEN8_GMUCX_POWER_COUNTER_XOCLK_L_0,
  2064. &busy->gpu_busy);
  2065. stats->busy_time = gpu_busy * 10;
  2066. do_div(stats->busy_time, 192);
  2067. if (ADRENO_FEATURE(adreno_dev, ADRENO_IFPC)) {
  2068. u32 ifpc = counter_delta(device,
  2069. GEN8_GMUCX_POWER_COUNTER_XOCLK_L_4,
  2070. &busy->num_ifpc);
  2071. adreno_dev->ifpc_count += ifpc;
  2072. if (ifpc > 0)
  2073. trace_adreno_ifpc_count(adreno_dev->ifpc_count);
  2074. }
  2075. if (device->pwrctrl.bus_control)
  2076. gen8_read_bus_stats(device, stats, busy);
  2077. if (adreno_dev->bcl_enabled) {
  2078. u32 a, b, c, bcl_throttle;
  2079. a = counter_delta(device, GEN8_GMUCX_POWER_COUNTER_XOCLK_L_1,
  2080. &busy->throttle_cycles[0]);
  2081. b = counter_delta(device, GEN8_GMUCX_POWER_COUNTER_XOCLK_L_2,
  2082. &busy->throttle_cycles[1]);
  2083. c = counter_delta(device, GEN8_GMUCX_POWER_COUNTER_XOCLK_L_3,
  2084. &busy->throttle_cycles[2]);
  2085. if (a || b || c)
  2086. trace_kgsl_bcl_clock_throttling(a, b, c);
  2087. bcl_throttle = counter_delta(device,
  2088. GEN8_GMUCX_POWER_COUNTER_XOCLK_L_5, &busy->bcl_throttle);
  2089. /*
  2090. * This counts number of cycles throttled in XO cycles. Convert it to
  2091. * micro seconds by dividing by XO freq which is 19.2MHz.
  2092. */
  2093. adreno_dev->bcl_throttle_time_us += ((bcl_throttle * 10) / 192);
  2094. }
  2095. }
  2096. static int gen8_setproperty(struct kgsl_device_private *dev_priv,
  2097. u32 type, void __user *value, u32 sizebytes)
  2098. {
  2099. struct kgsl_device *device = dev_priv->device;
  2100. struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
  2101. u32 enable;
  2102. if (type != KGSL_PROP_PWRCTRL)
  2103. return -ENODEV;
  2104. if (sizebytes != sizeof(enable))
  2105. return -EINVAL;
  2106. if (copy_from_user(&enable, value, sizeof(enable)))
  2107. return -EFAULT;
  2108. mutex_lock(&device->mutex);
  2109. if (enable) {
  2110. clear_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags);
  2111. kgsl_pwrscale_enable(device);
  2112. } else {
  2113. set_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags);
  2114. if (!adreno_active_count_get(adreno_dev))
  2115. adreno_active_count_put(adreno_dev);
  2116. kgsl_pwrscale_disable(device, true);
  2117. }
  2118. mutex_unlock(&device->mutex);
  2119. return 0;
  2120. }
  2121. static void gen8_set_isdb_breakpoint_registers(struct adreno_device *adreno_dev)
  2122. {
  2123. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  2124. struct clk *clk;
  2125. int ret;
  2126. if (!device->set_isdb_breakpoint || device->ftbl->is_hwcg_on(device)
  2127. || device->qdss_gfx_virt == NULL || !device->force_panic)
  2128. return;
  2129. clk = clk_get(&device->pdev->dev, "apb_pclk");
  2130. if (IS_ERR(clk)) {
  2131. dev_err(device->dev, "Unable to get QDSS clock\n");
  2132. goto err;
  2133. }
  2134. ret = clk_prepare_enable(clk);
  2135. if (ret) {
  2136. dev_err(device->dev, "QDSS Clock enable error: %d\n", ret);
  2137. clk_put(clk);
  2138. goto err;
  2139. }
  2140. /* Issue break command for SPs */
  2141. isdb_write(device->qdss_gfx_virt, 0x0000);
  2142. isdb_write(device->qdss_gfx_virt, 0x1000);
  2143. isdb_write(device->qdss_gfx_virt, 0x2000);
  2144. isdb_write(device->qdss_gfx_virt, 0x3000);
  2145. isdb_write(device->qdss_gfx_virt, 0x4000);
  2146. isdb_write(device->qdss_gfx_virt, 0x5000);
  2147. isdb_write(device->qdss_gfx_virt, 0x6000);
  2148. isdb_write(device->qdss_gfx_virt, 0x7000);
  2149. isdb_write(device->qdss_gfx_virt, 0x8000);
  2150. isdb_write(device->qdss_gfx_virt, 0x9000);
  2151. isdb_write(device->qdss_gfx_virt, 0xa000);
  2152. isdb_write(device->qdss_gfx_virt, 0xb000);
  2153. clk_disable_unprepare(clk);
  2154. clk_put(clk);
  2155. return;
  2156. err:
  2157. /* Do not force kernel panic if isdb writes did not go through */
  2158. device->force_panic = false;
  2159. }
  2160. static void gen8_swfuse_irqctrl(struct adreno_device *adreno_dev, bool state)
  2161. {
  2162. kgsl_regwrite(KGSL_DEVICE(adreno_dev), GEN8_RBBM_SW_FUSE_INT_MASK,
  2163. state ? GEN8_SW_FUSE_INT_MASK : 0);
  2164. }
  2165. static void gen8_lpac_fault_header(struct adreno_device *adreno_dev,
  2166. struct kgsl_drawobj *drawobj)
  2167. {
  2168. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  2169. struct adreno_context *drawctxt;
  2170. u32 status = 0, rptr = 0, wptr = 0, ib1sz = 0, ib2sz = 0, ib3sz = 0;
  2171. u64 ib1base = 0, ib2base = 0, ib3base = 0;
  2172. bool gx_on = adreno_gx_is_on(adreno_dev);
  2173. drawctxt = ADRENO_CONTEXT(drawobj->context);
  2174. drawobj->context->last_faulted_cmd_ts = drawobj->timestamp;
  2175. drawobj->context->total_fault_count++;
  2176. pr_context(device, drawobj->context,
  2177. "LPAC ctx %u ctx_type %s ts %u policy %lX dispatch_queue=%d\n",
  2178. drawobj->context->id, kgsl_context_type(drawctxt->type),
  2179. drawobj->timestamp, CMDOBJ(drawobj)->fault_recovery,
  2180. drawobj->context->gmu_dispatch_queue);
  2181. pr_context(device, drawobj->context, "lpac cmdline: %s\n",
  2182. drawctxt->base.proc_priv->cmdline);
  2183. if (!gen8_gmu_rpmh_pwr_state_is_active(device) || !gx_on)
  2184. goto done;
  2185. kgsl_regread(device, GEN8_RBBM_LPAC_STATUS, &status);
  2186. kgsl_regread(device, GEN8_CP_RB_RPTR_LPAC, &rptr);
  2187. kgsl_regread(device, GEN8_CP_RB_WPTR_LPAC, &wptr);
  2188. gen8_regread64_aperture(device, GEN8_CP_IB1_BASE_LO_PIPE,
  2189. GEN8_CP_IB1_BASE_HI_PIPE, &ib1base, PIPE_LPAC, 0, 0);
  2190. gen8_regread_aperture(device, GEN8_CP_IB1_REM_SIZE_PIPE, &ib1sz, PIPE_LPAC, 0, 0);
  2191. gen8_regread64_aperture(device, GEN8_CP_IB2_BASE_LO_PIPE,
  2192. GEN8_CP_IB2_BASE_HI_PIPE, &ib2base, PIPE_LPAC, 0, 0);
  2193. gen8_regread_aperture(device, GEN8_CP_IB2_REM_SIZE_PIPE, &ib2sz, PIPE_LPAC, 0, 0);
  2194. gen8_regread64_aperture(device, GEN8_CP_IB3_BASE_LO_PIPE,
  2195. GEN8_CP_IB3_BASE_HI_PIPE, &ib3base, PIPE_LPAC, 0, 0);
  2196. gen8_regread_aperture(device, GEN8_CP_IB3_REM_SIZE_PIPE, &ib3sz, PIPE_LPAC, 0, 0);
  2197. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  2198. pr_context(device, drawobj->context,
  2199. "LPAC: status %8.8X rb %4.4x/%4.4x ib1 %16.16llX/%4.4x ib2 %16.16llX/%4.4x ib3 %16.16llX/%4.4x\n",
  2200. status, rptr, wptr, ib1base, ib1sz, ib2base, ib2sz, ib3base, ib3sz);
  2201. done:
  2202. trace_adreno_gpu_fault(drawobj->context->id, drawobj->timestamp, status,
  2203. rptr, wptr, ib1base, ib1sz, ib2base, ib2sz,
  2204. adreno_get_level(drawobj->context));
  2205. }
  2206. static void gen8_fault_header(struct adreno_device *adreno_dev,
  2207. struct kgsl_drawobj *drawobj)
  2208. {
  2209. struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
  2210. struct adreno_context *drawctxt;
  2211. u32 status = 0, rptr = 0, wptr = 0, ib1sz = 0, ib2sz = 0, ib3sz, rptr_bv = 0;
  2212. u32 ib1sz_bv = 0, ib2sz_bv = 0, ib3sz_bv, gfx_status, gfx_br_status, gfx_bv_status;
  2213. u64 ib1base = 0, ib2base = 0, ib3base, ib1base_bv = 0, ib2base_bv, ib3base_bv;
  2214. u32 ctxt_id = 0, ts = 0;
  2215. int rb_id = -1;
  2216. bool gx_on = adreno_gx_is_on(adreno_dev);
  2217. if (drawobj) {
  2218. drawctxt = ADRENO_CONTEXT(drawobj->context);
  2219. drawobj->context->last_faulted_cmd_ts = drawobj->timestamp;
  2220. drawobj->context->total_fault_count++;
  2221. ctxt_id = drawobj->context->id;
  2222. ts = drawobj->timestamp;
  2223. rb_id = adreno_get_level(drawobj->context);
  2224. pr_context(device, drawobj->context, "ctx %u ctx_type %s ts %u policy %lX\n",
  2225. drawobj->context->id, kgsl_context_type(drawctxt->type),
  2226. drawobj->timestamp, CMDOBJ(drawobj)->fault_recovery);
  2227. pr_context(device, drawobj->context, "cmdline: %s\n",
  2228. drawctxt->base.proc_priv->cmdline);
  2229. }
  2230. if (!gen8_gmu_rpmh_pwr_state_is_active(device) || !gx_on)
  2231. goto done;
  2232. kgsl_regread(device, GEN8_RBBM_STATUS, &status);
  2233. kgsl_regread(device, GEN8_RBBM_GFX_STATUS, &gfx_status);
  2234. kgsl_regread(device, GEN8_RBBM_GFX_BV_STATUS, &gfx_bv_status);
  2235. kgsl_regread(device, GEN8_RBBM_GFX_BR_STATUS, &gfx_br_status);
  2236. kgsl_regread(device, GEN8_CP_RB_RPTR_BR, &rptr);
  2237. kgsl_regread(device, GEN8_CP_RB_WPTR_GC, &wptr);
  2238. kgsl_regread(device, GEN8_CP_RB_RPTR_BV, &rptr_bv);
  2239. gen8_regread64_aperture(device, GEN8_CP_IB1_BASE_LO_PIPE,
  2240. GEN8_CP_IB1_BASE_HI_PIPE, &ib1base, PIPE_BR, 0, 0);
  2241. gen8_regread_aperture(device, GEN8_CP_IB1_REM_SIZE_PIPE, &ib1sz, PIPE_BR, 0, 0);
  2242. gen8_regread64_aperture(device, GEN8_CP_IB2_BASE_LO_PIPE,
  2243. GEN8_CP_IB2_BASE_HI_PIPE, &ib2base, PIPE_BR, 0, 0);
  2244. gen8_regread_aperture(device, GEN8_CP_IB2_REM_SIZE_PIPE, &ib2sz, PIPE_BR, 0, 0);
  2245. gen8_regread64_aperture(device, GEN8_CP_IB3_BASE_LO_PIPE,
  2246. GEN8_CP_IB3_BASE_HI_PIPE, &ib3base, PIPE_BR, 0, 0);
  2247. gen8_regread_aperture(device, GEN8_CP_IB3_REM_SIZE_PIPE, &ib3sz, PIPE_BR, 0, 0);
  2248. gen8_regread64_aperture(device, GEN8_CP_IB1_BASE_LO_PIPE,
  2249. GEN8_CP_IB1_BASE_HI_PIPE, &ib1base_bv, PIPE_BV, 0, 0);
  2250. gen8_regread_aperture(device, GEN8_CP_IB1_REM_SIZE_PIPE, &ib1sz_bv, PIPE_BV, 0, 0);
  2251. gen8_regread64_aperture(device, GEN8_CP_IB2_BASE_LO_PIPE,
  2252. GEN8_CP_IB2_BASE_HI_PIPE, &ib2base_bv, PIPE_BV, 0, 0);
  2253. gen8_regread_aperture(device, GEN8_CP_IB2_REM_SIZE_PIPE, &ib2sz_bv, PIPE_BV, 0, 0);
  2254. gen8_regread64_aperture(device, GEN8_CP_IB3_BASE_LO_PIPE,
  2255. GEN8_CP_IB3_BASE_HI_PIPE, &ib3base_bv, PIPE_BV, 0, 0);
  2256. gen8_regread_aperture(device, GEN8_CP_IB3_REM_SIZE_PIPE, &ib3sz_bv, PIPE_BV, 0, 0);
  2257. gen8_host_aperture_set(adreno_dev, 0, 0, 0);
  2258. dev_err(device->dev,
  2259. "status %8.8X gfx_status %8.8X gfx_br_status %8.8X gfx_bv_status %8.8X\n",
  2260. status, gfx_status, gfx_br_status, gfx_bv_status);
  2261. dev_err(device->dev,
  2262. "BR: rb %4.4x/%4.4x ib1 %16.16llX/%4.4x ib2 %16.16llX/%4.4x ib3 %16.16llX/%4.4x\n",
  2263. rptr, wptr, ib1base, ib1sz, ib2base, ib2sz, ib3base, ib3sz);
  2264. dev_err(device->dev,
  2265. "BV: rb %4.4x/%4.4x ib1 %16.16llX/%4.4x ib2 %16.16llX/%4.4x ib3 %16.16llX/%4.4x\n",
  2266. rptr_bv, wptr, ib1base_bv, ib1sz_bv, ib2base_bv, ib2sz_bv, ib3base_bv, ib3sz_bv);
  2267. done:
  2268. trace_adreno_gpu_fault(ctxt_id, ts, status,
  2269. rptr, wptr, ib1base, ib1sz, ib2base, ib2sz, rb_id);
  2270. }
  2271. const struct gen8_gpudev adreno_gen8_hwsched_gpudev = {
  2272. .base = {
  2273. .reg_offsets = gen8_register_offsets,
  2274. .probe = gen8_hwsched_probe,
  2275. .snapshot = gen8_hwsched_snapshot,
  2276. .irq_handler = gen8_irq_handler,
  2277. .iommu_fault_block = gen8_iommu_fault_block,
  2278. .preemption_context_init = gen8_preemption_context_init,
  2279. .context_detach = gen8_hwsched_context_detach,
  2280. .read_alwayson = gen8_read_alwayson,
  2281. .reset = gen8_hwsched_reset_replay,
  2282. .power_ops = &gen8_hwsched_power_ops,
  2283. .power_stats = gen8_power_stats,
  2284. .setproperty = gen8_setproperty,
  2285. .hw_isidle = gen8_hw_isidle,
  2286. .add_to_va_minidump = gen8_hwsched_add_to_minidump,
  2287. .gx_is_on = gen8_gmu_gx_is_on,
  2288. .send_recurring_cmdobj = gen8_hwsched_send_recurring_cmdobj,
  2289. .perfcounter_remove = gen8_perfcounter_remove,
  2290. .set_isdb_breakpoint_registers = gen8_set_isdb_breakpoint_registers,
  2291. .context_destroy = gen8_hwsched_context_destroy,
  2292. .lpac_store = gen8_lpac_store,
  2293. .get_uche_trap_base = gen8_get_uche_trap_base,
  2294. .fault_header = gen8_fault_header,
  2295. .lpac_fault_header = gen8_lpac_fault_header,
  2296. },
  2297. .hfi_probe = gen8_hwsched_hfi_probe,
  2298. .hfi_remove = gen8_hwsched_hfi_remove,
  2299. .handle_watchdog = gen8_hwsched_handle_watchdog,
  2300. };
  2301. const struct gen8_gpudev adreno_gen8_gmu_gpudev = {
  2302. .base = {
  2303. .reg_offsets = gen8_register_offsets,
  2304. .probe = gen8_gmu_device_probe,
  2305. .snapshot = gen8_gmu_snapshot,
  2306. .irq_handler = gen8_irq_handler,
  2307. .rb_start = gen8_rb_start,
  2308. .gpu_keepalive = gen8_gpu_keepalive,
  2309. .hw_isidle = gen8_hw_isidle,
  2310. .iommu_fault_block = gen8_iommu_fault_block,
  2311. .reset = gen8_gmu_reset,
  2312. .preemption_schedule = gen8_preemption_schedule,
  2313. .preemption_context_init = gen8_preemption_context_init,
  2314. .read_alwayson = gen8_read_alwayson,
  2315. .power_ops = &gen8_gmu_power_ops,
  2316. .remove = gen8_remove,
  2317. .ringbuffer_submitcmd = gen8_ringbuffer_submitcmd,
  2318. .power_stats = gen8_power_stats,
  2319. .setproperty = gen8_setproperty,
  2320. .add_to_va_minidump = gen8_gmu_add_to_minidump,
  2321. .gx_is_on = gen8_gmu_gx_is_on,
  2322. .perfcounter_remove = gen8_perfcounter_remove,
  2323. .set_isdb_breakpoint_registers = gen8_set_isdb_breakpoint_registers,
  2324. .swfuse_irqctrl = gen8_swfuse_irqctrl,
  2325. .get_uche_trap_base = gen8_get_uche_trap_base,
  2326. .fault_header = gen8_fault_header,
  2327. },
  2328. .hfi_probe = gen8_gmu_hfi_probe,
  2329. .handle_watchdog = gen8_gmu_handle_watchdog,
  2330. };