etnaviv_perfmon.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (C) 2017 Etnaviv Project
  4. * Copyright (C) 2017 Zodiac Inflight Innovations
  5. */
  6. #include "etnaviv_gpu.h"
  7. #include "etnaviv_perfmon.h"
  8. #include "state_hi.xml.h"
  9. struct etnaviv_pm_domain;
  10. struct etnaviv_pm_signal {
  11. char name[64];
  12. u32 data;
  13. u32 (*sample)(struct etnaviv_gpu *gpu,
  14. const struct etnaviv_pm_domain *domain,
  15. const struct etnaviv_pm_signal *signal);
  16. };
  17. struct etnaviv_pm_domain {
  18. char name[64];
  19. /* profile register */
  20. u32 profile_read;
  21. u32 profile_config;
  22. u8 nr_signals;
  23. const struct etnaviv_pm_signal *signal;
  24. };
  25. struct etnaviv_pm_domain_meta {
  26. const struct etnaviv_pm_domain *domains;
  27. u32 nr_domains;
  28. };
  29. static u32 simple_reg_read(struct etnaviv_gpu *gpu,
  30. const struct etnaviv_pm_domain *domain,
  31. const struct etnaviv_pm_signal *signal)
  32. {
  33. return gpu_read(gpu, signal->data);
  34. }
  35. static u32 perf_reg_read(struct etnaviv_gpu *gpu,
  36. const struct etnaviv_pm_domain *domain,
  37. const struct etnaviv_pm_signal *signal)
  38. {
  39. gpu_write(gpu, domain->profile_config, signal->data);
  40. return gpu_read(gpu, domain->profile_read);
  41. }
  42. static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
  43. const struct etnaviv_pm_domain *domain,
  44. const struct etnaviv_pm_signal *signal)
  45. {
  46. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  47. u32 value = 0;
  48. unsigned i;
  49. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  50. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  51. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(i);
  52. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  53. gpu_write(gpu, domain->profile_config, signal->data);
  54. value += gpu_read(gpu, domain->profile_read);
  55. }
  56. /* switch back to pixel pipe 0 to prevent GPU hang */
  57. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  58. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(0);
  59. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  60. return value;
  61. }
  62. static const struct etnaviv_pm_domain doms_3d[] = {
  63. {
  64. .name = "HI",
  65. .profile_read = VIVS_MC_PROFILE_HI_READ,
  66. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  67. .nr_signals = 5,
  68. .signal = (const struct etnaviv_pm_signal[]) {
  69. {
  70. "TOTAL_CYCLES",
  71. VIVS_HI_PROFILE_TOTAL_CYCLES,
  72. &simple_reg_read
  73. },
  74. {
  75. "IDLE_CYCLES",
  76. VIVS_HI_PROFILE_IDLE_CYCLES,
  77. &simple_reg_read
  78. },
  79. {
  80. "AXI_CYCLES_READ_REQUEST_STALLED",
  81. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
  82. &perf_reg_read
  83. },
  84. {
  85. "AXI_CYCLES_WRITE_REQUEST_STALLED",
  86. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
  87. &perf_reg_read
  88. },
  89. {
  90. "AXI_CYCLES_WRITE_DATA_STALLED",
  91. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
  92. &perf_reg_read
  93. }
  94. }
  95. },
  96. {
  97. .name = "PE",
  98. .profile_read = VIVS_MC_PROFILE_PE_READ,
  99. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  100. .nr_signals = 5,
  101. .signal = (const struct etnaviv_pm_signal[]) {
  102. {
  103. "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
  104. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
  105. &pipe_reg_read
  106. },
  107. {
  108. "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
  109. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
  110. &pipe_reg_read
  111. },
  112. {
  113. "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
  114. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
  115. &pipe_reg_read
  116. },
  117. {
  118. "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
  119. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
  120. &pipe_reg_read
  121. }
  122. }
  123. },
  124. {
  125. .name = "SH",
  126. .profile_read = VIVS_MC_PROFILE_SH_READ,
  127. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  128. .nr_signals = 9,
  129. .signal = (const struct etnaviv_pm_signal[]) {
  130. {
  131. "SHADER_CYCLES",
  132. VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
  133. &perf_reg_read
  134. },
  135. {
  136. "PS_INST_COUNTER",
  137. VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
  138. &perf_reg_read
  139. },
  140. {
  141. "RENDERED_PIXEL_COUNTER",
  142. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
  143. &perf_reg_read
  144. },
  145. {
  146. "VS_INST_COUNTER",
  147. VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
  148. &pipe_reg_read
  149. },
  150. {
  151. "RENDERED_VERTICE_COUNTER",
  152. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
  153. &pipe_reg_read
  154. },
  155. {
  156. "VTX_BRANCH_INST_COUNTER",
  157. VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
  158. &pipe_reg_read
  159. },
  160. {
  161. "VTX_TEXLD_INST_COUNTER",
  162. VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
  163. &pipe_reg_read
  164. },
  165. {
  166. "PXL_BRANCH_INST_COUNTER",
  167. VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
  168. &pipe_reg_read
  169. },
  170. {
  171. "PXL_TEXLD_INST_COUNTER",
  172. VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
  173. &pipe_reg_read
  174. }
  175. }
  176. },
  177. {
  178. .name = "PA",
  179. .profile_read = VIVS_MC_PROFILE_PA_READ,
  180. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  181. .nr_signals = 6,
  182. .signal = (const struct etnaviv_pm_signal[]) {
  183. {
  184. "INPUT_VTX_COUNTER",
  185. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
  186. &perf_reg_read
  187. },
  188. {
  189. "INPUT_PRIM_COUNTER",
  190. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
  191. &perf_reg_read
  192. },
  193. {
  194. "OUTPUT_PRIM_COUNTER",
  195. VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
  196. &perf_reg_read
  197. },
  198. {
  199. "DEPTH_CLIPPED_COUNTER",
  200. VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
  201. &pipe_reg_read
  202. },
  203. {
  204. "TRIVIAL_REJECTED_COUNTER",
  205. VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
  206. &pipe_reg_read
  207. },
  208. {
  209. "CULLED_COUNTER",
  210. VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
  211. &pipe_reg_read
  212. }
  213. }
  214. },
  215. {
  216. .name = "SE",
  217. .profile_read = VIVS_MC_PROFILE_SE_READ,
  218. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  219. .nr_signals = 2,
  220. .signal = (const struct etnaviv_pm_signal[]) {
  221. {
  222. "CULLED_TRIANGLE_COUNT",
  223. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
  224. &perf_reg_read
  225. },
  226. {
  227. "CULLED_LINES_COUNT",
  228. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
  229. &perf_reg_read
  230. }
  231. }
  232. },
  233. {
  234. .name = "RA",
  235. .profile_read = VIVS_MC_PROFILE_RA_READ,
  236. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  237. .nr_signals = 7,
  238. .signal = (const struct etnaviv_pm_signal[]) {
  239. {
  240. "VALID_PIXEL_COUNT",
  241. VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
  242. &perf_reg_read
  243. },
  244. {
  245. "TOTAL_QUAD_COUNT",
  246. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
  247. &perf_reg_read
  248. },
  249. {
  250. "VALID_QUAD_COUNT_AFTER_EARLY_Z",
  251. VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
  252. &perf_reg_read
  253. },
  254. {
  255. "TOTAL_PRIMITIVE_COUNT",
  256. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
  257. &perf_reg_read
  258. },
  259. {
  260. "PIPE_CACHE_MISS_COUNTER",
  261. VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
  262. &perf_reg_read
  263. },
  264. {
  265. "PREFETCH_CACHE_MISS_COUNTER",
  266. VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
  267. &perf_reg_read
  268. },
  269. {
  270. "CULLED_QUAD_COUNT",
  271. VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
  272. &perf_reg_read
  273. }
  274. }
  275. },
  276. {
  277. .name = "TX",
  278. .profile_read = VIVS_MC_PROFILE_TX_READ,
  279. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  280. .nr_signals = 9,
  281. .signal = (const struct etnaviv_pm_signal[]) {
  282. {
  283. "TOTAL_BILINEAR_REQUESTS",
  284. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
  285. &perf_reg_read
  286. },
  287. {
  288. "TOTAL_TRILINEAR_REQUESTS",
  289. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
  290. &perf_reg_read
  291. },
  292. {
  293. "TOTAL_DISCARDED_TEXTURE_REQUESTS",
  294. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
  295. &perf_reg_read
  296. },
  297. {
  298. "TOTAL_TEXTURE_REQUESTS",
  299. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
  300. &perf_reg_read
  301. },
  302. {
  303. "MEM_READ_COUNT",
  304. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
  305. &perf_reg_read
  306. },
  307. {
  308. "MEM_READ_IN_8B_COUNT",
  309. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
  310. &perf_reg_read
  311. },
  312. {
  313. "CACHE_MISS_COUNT",
  314. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
  315. &perf_reg_read
  316. },
  317. {
  318. "CACHE_HIT_TEXEL_COUNT",
  319. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
  320. &perf_reg_read
  321. },
  322. {
  323. "CACHE_MISS_TEXEL_COUNT",
  324. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
  325. &perf_reg_read
  326. }
  327. }
  328. },
  329. {
  330. .name = "MC",
  331. .profile_read = VIVS_MC_PROFILE_MC_READ,
  332. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  333. .nr_signals = 3,
  334. .signal = (const struct etnaviv_pm_signal[]) {
  335. {
  336. "TOTAL_READ_REQ_8B_FROM_PIPELINE",
  337. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
  338. &perf_reg_read
  339. },
  340. {
  341. "TOTAL_READ_REQ_8B_FROM_IP",
  342. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
  343. &perf_reg_read
  344. },
  345. {
  346. "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
  347. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
  348. &perf_reg_read
  349. }
  350. }
  351. }
  352. };
  353. static const struct etnaviv_pm_domain doms_2d[] = {
  354. {
  355. .name = "PE",
  356. .profile_read = VIVS_MC_PROFILE_PE_READ,
  357. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  358. .nr_signals = 1,
  359. .signal = (const struct etnaviv_pm_signal[]) {
  360. {
  361. "PIXELS_RENDERED_2D",
  362. VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
  363. &pipe_reg_read
  364. }
  365. }
  366. }
  367. };
  368. static const struct etnaviv_pm_domain doms_vg[] = {
  369. };
  370. static const struct etnaviv_pm_domain_meta doms_meta[] = {
  371. {
  372. .nr_domains = ARRAY_SIZE(doms_3d),
  373. .domains = &doms_3d[0]
  374. },
  375. {
  376. .nr_domains = ARRAY_SIZE(doms_2d),
  377. .domains = &doms_2d[0]
  378. },
  379. {
  380. .nr_domains = ARRAY_SIZE(doms_vg),
  381. .domains = &doms_vg[0]
  382. }
  383. };
  384. int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
  385. struct drm_etnaviv_pm_domain *domain)
  386. {
  387. const struct etnaviv_pm_domain_meta *meta = &doms_meta[domain->pipe];
  388. const struct etnaviv_pm_domain *dom;
  389. if (domain->iter >= meta->nr_domains)
  390. return -EINVAL;
  391. dom = meta->domains + domain->iter;
  392. domain->id = domain->iter;
  393. domain->nr_signals = dom->nr_signals;
  394. strncpy(domain->name, dom->name, sizeof(domain->name));
  395. domain->iter++;
  396. if (domain->iter == meta->nr_domains)
  397. domain->iter = 0xff;
  398. return 0;
  399. }
  400. int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
  401. struct drm_etnaviv_pm_signal *signal)
  402. {
  403. const struct etnaviv_pm_domain_meta *meta = &doms_meta[signal->pipe];
  404. const struct etnaviv_pm_domain *dom;
  405. const struct etnaviv_pm_signal *sig;
  406. if (signal->domain >= meta->nr_domains)
  407. return -EINVAL;
  408. dom = meta->domains + signal->domain;
  409. if (signal->iter > dom->nr_signals)
  410. return -EINVAL;
  411. sig = &dom->signal[signal->iter];
  412. signal->id = signal->iter;
  413. strncpy(signal->name, sig->name, sizeof(signal->name));
  414. signal->iter++;
  415. if (signal->iter == dom->nr_signals)
  416. signal->iter = 0xffff;
  417. return 0;
  418. }
  419. int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
  420. u32 exec_state)
  421. {
  422. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  423. const struct etnaviv_pm_domain *dom;
  424. if (r->domain >= meta->nr_domains)
  425. return -EINVAL;
  426. dom = meta->domains + r->domain;
  427. if (r->signal > dom->nr_signals)
  428. return -EINVAL;
  429. return 0;
  430. }
  431. void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
  432. const struct etnaviv_perfmon_request *pmr, u32 exec_state)
  433. {
  434. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  435. const struct etnaviv_pm_domain *dom;
  436. const struct etnaviv_pm_signal *sig;
  437. u32 *bo = pmr->bo_vma;
  438. u32 val;
  439. dom = meta->domains + pmr->domain;
  440. sig = &dom->signal[pmr->signal];
  441. val = sig->sample(gpu, dom, sig);
  442. *(bo + pmr->offset) = val;
  443. }