etnaviv_perfmon.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (C) 2017 Etnaviv Project
  4. * Copyright (C) 2017 Zodiac Inflight Innovations
  5. */
  6. #include "common.xml.h"
  7. #include "etnaviv_gpu.h"
  8. #include "etnaviv_perfmon.h"
  9. #include "state_hi.xml.h"
  10. struct etnaviv_pm_domain;
  11. struct etnaviv_pm_signal {
  12. char name[64];
  13. u32 data;
  14. u32 (*sample)(struct etnaviv_gpu *gpu,
  15. const struct etnaviv_pm_domain *domain,
  16. const struct etnaviv_pm_signal *signal);
  17. };
  18. struct etnaviv_pm_domain {
  19. char name[64];
  20. /* profile register */
  21. u32 profile_read;
  22. u32 profile_config;
  23. u8 nr_signals;
  24. const struct etnaviv_pm_signal *signal;
  25. };
  26. struct etnaviv_pm_domain_meta {
  27. unsigned int feature;
  28. const struct etnaviv_pm_domain *domains;
  29. u32 nr_domains;
  30. };
  31. static u32 perf_reg_read(struct etnaviv_gpu *gpu,
  32. const struct etnaviv_pm_domain *domain,
  33. const struct etnaviv_pm_signal *signal)
  34. {
  35. gpu_write(gpu, domain->profile_config, signal->data);
  36. return gpu_read(gpu, domain->profile_read);
  37. }
  38. static inline void pipe_select(struct etnaviv_gpu *gpu, u32 clock, unsigned pipe)
  39. {
  40. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  41. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(pipe);
  42. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  43. }
  44. static u32 pipe_perf_reg_read(struct etnaviv_gpu *gpu,
  45. const struct etnaviv_pm_domain *domain,
  46. const struct etnaviv_pm_signal *signal)
  47. {
  48. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  49. u32 value = 0;
  50. unsigned i;
  51. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  52. pipe_select(gpu, clock, i);
  53. value += perf_reg_read(gpu, domain, signal);
  54. }
  55. /* switch back to pixel pipe 0 to prevent GPU hang */
  56. pipe_select(gpu, clock, 0);
  57. return value;
  58. }
  59. static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
  60. const struct etnaviv_pm_domain *domain,
  61. const struct etnaviv_pm_signal *signal)
  62. {
  63. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  64. u32 value = 0;
  65. unsigned i;
  66. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  67. pipe_select(gpu, clock, i);
  68. value += gpu_read(gpu, signal->data);
  69. }
  70. /* switch back to pixel pipe 0 to prevent GPU hang */
  71. pipe_select(gpu, clock, 0);
  72. return value;
  73. }
  74. static u32 hi_total_cycle_read(struct etnaviv_gpu *gpu,
  75. const struct etnaviv_pm_domain *domain,
  76. const struct etnaviv_pm_signal *signal)
  77. {
  78. u32 reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  79. if (gpu->identity.model == chipModel_GC880 ||
  80. gpu->identity.model == chipModel_GC2000 ||
  81. gpu->identity.model == chipModel_GC2100)
  82. reg = VIVS_MC_PROFILE_CYCLE_COUNTER;
  83. return gpu_read(gpu, reg);
  84. }
  85. static u32 hi_total_idle_cycle_read(struct etnaviv_gpu *gpu,
  86. const struct etnaviv_pm_domain *domain,
  87. const struct etnaviv_pm_signal *signal)
  88. {
  89. u32 reg = VIVS_HI_PROFILE_IDLE_CYCLES;
  90. if (gpu->identity.model == chipModel_GC880 ||
  91. gpu->identity.model == chipModel_GC2000 ||
  92. gpu->identity.model == chipModel_GC2100)
  93. reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  94. return gpu_read(gpu, reg);
  95. }
  96. static const struct etnaviv_pm_domain doms_3d[] = {
  97. {
  98. .name = "HI",
  99. .profile_read = VIVS_MC_PROFILE_HI_READ,
  100. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  101. .nr_signals = 7,
  102. .signal = (const struct etnaviv_pm_signal[]) {
  103. {
  104. "TOTAL_READ_BYTES8",
  105. VIVS_HI_PROFILE_READ_BYTES8,
  106. &pipe_reg_read,
  107. },
  108. {
  109. "TOTAL_WRITE_BYTES8",
  110. VIVS_HI_PROFILE_WRITE_BYTES8,
  111. &pipe_reg_read,
  112. },
  113. {
  114. "TOTAL_CYCLES",
  115. 0,
  116. &hi_total_cycle_read
  117. },
  118. {
  119. "IDLE_CYCLES",
  120. 0,
  121. &hi_total_idle_cycle_read
  122. },
  123. {
  124. "AXI_CYCLES_READ_REQUEST_STALLED",
  125. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
  126. &perf_reg_read
  127. },
  128. {
  129. "AXI_CYCLES_WRITE_REQUEST_STALLED",
  130. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
  131. &perf_reg_read
  132. },
  133. {
  134. "AXI_CYCLES_WRITE_DATA_STALLED",
  135. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
  136. &perf_reg_read
  137. }
  138. }
  139. },
  140. {
  141. .name = "PE",
  142. .profile_read = VIVS_MC_PROFILE_PE_READ,
  143. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  144. .nr_signals = 4,
  145. .signal = (const struct etnaviv_pm_signal[]) {
  146. {
  147. "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
  148. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
  149. &pipe_perf_reg_read
  150. },
  151. {
  152. "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
  153. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
  154. &pipe_perf_reg_read
  155. },
  156. {
  157. "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
  158. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
  159. &pipe_perf_reg_read
  160. },
  161. {
  162. "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
  163. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
  164. &pipe_perf_reg_read
  165. }
  166. }
  167. },
  168. {
  169. .name = "SH",
  170. .profile_read = VIVS_MC_PROFILE_SH_READ,
  171. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  172. .nr_signals = 9,
  173. .signal = (const struct etnaviv_pm_signal[]) {
  174. {
  175. "SHADER_CYCLES",
  176. VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
  177. &perf_reg_read
  178. },
  179. {
  180. "PS_INST_COUNTER",
  181. VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
  182. &perf_reg_read
  183. },
  184. {
  185. "RENDERED_PIXEL_COUNTER",
  186. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
  187. &perf_reg_read
  188. },
  189. {
  190. "VS_INST_COUNTER",
  191. VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
  192. &pipe_perf_reg_read
  193. },
  194. {
  195. "RENDERED_VERTICE_COUNTER",
  196. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
  197. &pipe_perf_reg_read
  198. },
  199. {
  200. "VTX_BRANCH_INST_COUNTER",
  201. VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
  202. &pipe_perf_reg_read
  203. },
  204. {
  205. "VTX_TEXLD_INST_COUNTER",
  206. VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
  207. &pipe_perf_reg_read
  208. },
  209. {
  210. "PXL_BRANCH_INST_COUNTER",
  211. VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
  212. &pipe_perf_reg_read
  213. },
  214. {
  215. "PXL_TEXLD_INST_COUNTER",
  216. VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
  217. &pipe_perf_reg_read
  218. }
  219. }
  220. },
  221. {
  222. .name = "PA",
  223. .profile_read = VIVS_MC_PROFILE_PA_READ,
  224. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  225. .nr_signals = 6,
  226. .signal = (const struct etnaviv_pm_signal[]) {
  227. {
  228. "INPUT_VTX_COUNTER",
  229. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
  230. &perf_reg_read
  231. },
  232. {
  233. "INPUT_PRIM_COUNTER",
  234. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
  235. &perf_reg_read
  236. },
  237. {
  238. "OUTPUT_PRIM_COUNTER",
  239. VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
  240. &perf_reg_read
  241. },
  242. {
  243. "DEPTH_CLIPPED_COUNTER",
  244. VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
  245. &pipe_perf_reg_read
  246. },
  247. {
  248. "TRIVIAL_REJECTED_COUNTER",
  249. VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
  250. &pipe_perf_reg_read
  251. },
  252. {
  253. "CULLED_COUNTER",
  254. VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
  255. &pipe_perf_reg_read
  256. }
  257. }
  258. },
  259. {
  260. .name = "SE",
  261. .profile_read = VIVS_MC_PROFILE_SE_READ,
  262. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  263. .nr_signals = 2,
  264. .signal = (const struct etnaviv_pm_signal[]) {
  265. {
  266. "CULLED_TRIANGLE_COUNT",
  267. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
  268. &perf_reg_read
  269. },
  270. {
  271. "CULLED_LINES_COUNT",
  272. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
  273. &perf_reg_read
  274. }
  275. }
  276. },
  277. {
  278. .name = "RA",
  279. .profile_read = VIVS_MC_PROFILE_RA_READ,
  280. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  281. .nr_signals = 7,
  282. .signal = (const struct etnaviv_pm_signal[]) {
  283. {
  284. "VALID_PIXEL_COUNT",
  285. VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
  286. &perf_reg_read
  287. },
  288. {
  289. "TOTAL_QUAD_COUNT",
  290. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
  291. &perf_reg_read
  292. },
  293. {
  294. "VALID_QUAD_COUNT_AFTER_EARLY_Z",
  295. VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
  296. &perf_reg_read
  297. },
  298. {
  299. "TOTAL_PRIMITIVE_COUNT",
  300. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
  301. &perf_reg_read
  302. },
  303. {
  304. "PIPE_CACHE_MISS_COUNTER",
  305. VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
  306. &perf_reg_read
  307. },
  308. {
  309. "PREFETCH_CACHE_MISS_COUNTER",
  310. VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
  311. &perf_reg_read
  312. },
  313. {
  314. "CULLED_QUAD_COUNT",
  315. VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
  316. &perf_reg_read
  317. }
  318. }
  319. },
  320. {
  321. .name = "TX",
  322. .profile_read = VIVS_MC_PROFILE_TX_READ,
  323. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  324. .nr_signals = 9,
  325. .signal = (const struct etnaviv_pm_signal[]) {
  326. {
  327. "TOTAL_BILINEAR_REQUESTS",
  328. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
  329. &perf_reg_read
  330. },
  331. {
  332. "TOTAL_TRILINEAR_REQUESTS",
  333. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
  334. &perf_reg_read
  335. },
  336. {
  337. "TOTAL_DISCARDED_TEXTURE_REQUESTS",
  338. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
  339. &perf_reg_read
  340. },
  341. {
  342. "TOTAL_TEXTURE_REQUESTS",
  343. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
  344. &perf_reg_read
  345. },
  346. {
  347. "MEM_READ_COUNT",
  348. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
  349. &perf_reg_read
  350. },
  351. {
  352. "MEM_READ_IN_8B_COUNT",
  353. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
  354. &perf_reg_read
  355. },
  356. {
  357. "CACHE_MISS_COUNT",
  358. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
  359. &perf_reg_read
  360. },
  361. {
  362. "CACHE_HIT_TEXEL_COUNT",
  363. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
  364. &perf_reg_read
  365. },
  366. {
  367. "CACHE_MISS_TEXEL_COUNT",
  368. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
  369. &perf_reg_read
  370. }
  371. }
  372. },
  373. {
  374. .name = "MC",
  375. .profile_read = VIVS_MC_PROFILE_MC_READ,
  376. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  377. .nr_signals = 3,
  378. .signal = (const struct etnaviv_pm_signal[]) {
  379. {
  380. "TOTAL_READ_REQ_8B_FROM_PIPELINE",
  381. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
  382. &perf_reg_read
  383. },
  384. {
  385. "TOTAL_READ_REQ_8B_FROM_IP",
  386. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
  387. &perf_reg_read
  388. },
  389. {
  390. "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
  391. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
  392. &perf_reg_read
  393. }
  394. }
  395. }
  396. };
  397. static const struct etnaviv_pm_domain doms_2d[] = {
  398. {
  399. .name = "PE",
  400. .profile_read = VIVS_MC_PROFILE_PE_READ,
  401. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  402. .nr_signals = 1,
  403. .signal = (const struct etnaviv_pm_signal[]) {
  404. {
  405. "PIXELS_RENDERED_2D",
  406. VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
  407. &pipe_perf_reg_read
  408. }
  409. }
  410. }
  411. };
  412. static const struct etnaviv_pm_domain doms_vg[] = {
  413. };
  414. static const struct etnaviv_pm_domain_meta doms_meta[] = {
  415. {
  416. .feature = chipFeatures_PIPE_3D,
  417. .nr_domains = ARRAY_SIZE(doms_3d),
  418. .domains = &doms_3d[0]
  419. },
  420. {
  421. .feature = chipFeatures_PIPE_2D,
  422. .nr_domains = ARRAY_SIZE(doms_2d),
  423. .domains = &doms_2d[0]
  424. },
  425. {
  426. .feature = chipFeatures_PIPE_VG,
  427. .nr_domains = ARRAY_SIZE(doms_vg),
  428. .domains = &doms_vg[0]
  429. }
  430. };
  431. static unsigned int num_pm_domains(const struct etnaviv_gpu *gpu)
  432. {
  433. unsigned int num = 0, i;
  434. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  435. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  436. if (gpu->identity.features & meta->feature)
  437. num += meta->nr_domains;
  438. }
  439. return num;
  440. }
  441. static const struct etnaviv_pm_domain *pm_domain(const struct etnaviv_gpu *gpu,
  442. unsigned int index)
  443. {
  444. const struct etnaviv_pm_domain *domain = NULL;
  445. unsigned int offset = 0, i;
  446. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  447. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  448. if (!(gpu->identity.features & meta->feature))
  449. continue;
  450. if (index - offset >= meta->nr_domains) {
  451. offset += meta->nr_domains;
  452. continue;
  453. }
  454. domain = meta->domains + (index - offset);
  455. }
  456. return domain;
  457. }
  458. int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
  459. struct drm_etnaviv_pm_domain *domain)
  460. {
  461. const unsigned int nr_domains = num_pm_domains(gpu);
  462. const struct etnaviv_pm_domain *dom;
  463. if (domain->iter >= nr_domains)
  464. return -EINVAL;
  465. dom = pm_domain(gpu, domain->iter);
  466. if (!dom)
  467. return -EINVAL;
  468. domain->id = domain->iter;
  469. domain->nr_signals = dom->nr_signals;
  470. strncpy(domain->name, dom->name, sizeof(domain->name));
  471. domain->iter++;
  472. if (domain->iter == nr_domains)
  473. domain->iter = 0xff;
  474. return 0;
  475. }
  476. int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
  477. struct drm_etnaviv_pm_signal *signal)
  478. {
  479. const unsigned int nr_domains = num_pm_domains(gpu);
  480. const struct etnaviv_pm_domain *dom;
  481. const struct etnaviv_pm_signal *sig;
  482. if (signal->domain >= nr_domains)
  483. return -EINVAL;
  484. dom = pm_domain(gpu, signal->domain);
  485. if (!dom)
  486. return -EINVAL;
  487. if (signal->iter >= dom->nr_signals)
  488. return -EINVAL;
  489. sig = &dom->signal[signal->iter];
  490. signal->id = signal->iter;
  491. strncpy(signal->name, sig->name, sizeof(signal->name));
  492. signal->iter++;
  493. if (signal->iter == dom->nr_signals)
  494. signal->iter = 0xffff;
  495. return 0;
  496. }
  497. int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
  498. u32 exec_state)
  499. {
  500. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  501. const struct etnaviv_pm_domain *dom;
  502. if (r->domain >= meta->nr_domains)
  503. return -EINVAL;
  504. dom = meta->domains + r->domain;
  505. if (r->signal >= dom->nr_signals)
  506. return -EINVAL;
  507. return 0;
  508. }
  509. void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
  510. const struct etnaviv_perfmon_request *pmr, u32 exec_state)
  511. {
  512. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  513. const struct etnaviv_pm_domain *dom;
  514. const struct etnaviv_pm_signal *sig;
  515. u32 *bo = pmr->bo_vma;
  516. u32 val;
  517. dom = meta->domains + pmr->domain;
  518. sig = &dom->signal[pmr->signal];
  519. val = sig->sample(gpu, dom, sig);
  520. *(bo + pmr->offset) = val;
  521. }