etnaviv_perfmon.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495
  1. /*
  2. * Copyright (C) 2017 Etnaviv Project
  3. * Copyright (C) 2017 Zodiac Inflight Innovations
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms of the GNU General Public License version 2 as published by
  7. * the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope that it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program. If not, see <http://www.gnu.org/licenses/>.
  16. */
  17. #include "etnaviv_gpu.h"
  18. #include "etnaviv_perfmon.h"
  19. #include "state_hi.xml.h"
  20. struct etnaviv_pm_domain;
  21. struct etnaviv_pm_signal {
  22. char name[64];
  23. u32 data;
  24. u32 (*sample)(struct etnaviv_gpu *gpu,
  25. const struct etnaviv_pm_domain *domain,
  26. const struct etnaviv_pm_signal *signal);
  27. };
  28. struct etnaviv_pm_domain {
  29. char name[64];
  30. /* profile register */
  31. u32 profile_read;
  32. u32 profile_config;
  33. u8 nr_signals;
  34. const struct etnaviv_pm_signal *signal;
  35. };
  36. struct etnaviv_pm_domain_meta {
  37. const struct etnaviv_pm_domain *domains;
  38. u32 nr_domains;
  39. };
  40. static u32 simple_reg_read(struct etnaviv_gpu *gpu,
  41. const struct etnaviv_pm_domain *domain,
  42. const struct etnaviv_pm_signal *signal)
  43. {
  44. return gpu_read(gpu, signal->data);
  45. }
  46. static u32 perf_reg_read(struct etnaviv_gpu *gpu,
  47. const struct etnaviv_pm_domain *domain,
  48. const struct etnaviv_pm_signal *signal)
  49. {
  50. gpu_write(gpu, domain->profile_config, signal->data);
  51. return gpu_read(gpu, domain->profile_read);
  52. }
  53. static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
  54. const struct etnaviv_pm_domain *domain,
  55. const struct etnaviv_pm_signal *signal)
  56. {
  57. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  58. u32 value = 0;
  59. unsigned i;
  60. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  61. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  62. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(i);
  63. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  64. gpu_write(gpu, domain->profile_config, signal->data);
  65. value += gpu_read(gpu, domain->profile_read);
  66. }
  67. /* switch back to pixel pipe 0 to prevent GPU hang */
  68. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  69. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(0);
  70. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  71. return value;
  72. }
  73. static const struct etnaviv_pm_domain doms_3d[] = {
  74. {
  75. .name = "HI",
  76. .profile_read = VIVS_MC_PROFILE_HI_READ,
  77. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  78. .nr_signals = 5,
  79. .signal = (const struct etnaviv_pm_signal[]) {
  80. {
  81. "TOTAL_CYCLES",
  82. VIVS_HI_PROFILE_TOTAL_CYCLES,
  83. &simple_reg_read
  84. },
  85. {
  86. "IDLE_CYCLES",
  87. VIVS_HI_PROFILE_IDLE_CYCLES,
  88. &simple_reg_read
  89. },
  90. {
  91. "AXI_CYCLES_READ_REQUEST_STALLED",
  92. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
  93. &perf_reg_read
  94. },
  95. {
  96. "AXI_CYCLES_WRITE_REQUEST_STALLED",
  97. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
  98. &perf_reg_read
  99. },
  100. {
  101. "AXI_CYCLES_WRITE_DATA_STALLED",
  102. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
  103. &perf_reg_read
  104. }
  105. }
  106. },
  107. {
  108. .name = "PE",
  109. .profile_read = VIVS_MC_PROFILE_PE_READ,
  110. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  111. .nr_signals = 5,
  112. .signal = (const struct etnaviv_pm_signal[]) {
  113. {
  114. "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
  115. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
  116. &pipe_reg_read
  117. },
  118. {
  119. "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
  120. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
  121. &pipe_reg_read
  122. },
  123. {
  124. "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
  125. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
  126. &pipe_reg_read
  127. },
  128. {
  129. "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
  130. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
  131. &pipe_reg_read
  132. }
  133. }
  134. },
  135. {
  136. .name = "SH",
  137. .profile_read = VIVS_MC_PROFILE_SH_READ,
  138. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  139. .nr_signals = 9,
  140. .signal = (const struct etnaviv_pm_signal[]) {
  141. {
  142. "SHADER_CYCLES",
  143. VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
  144. &perf_reg_read
  145. },
  146. {
  147. "PS_INST_COUNTER",
  148. VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
  149. &perf_reg_read
  150. },
  151. {
  152. "RENDERED_PIXEL_COUNTER",
  153. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
  154. &perf_reg_read
  155. },
  156. {
  157. "VS_INST_COUNTER",
  158. VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
  159. &pipe_reg_read
  160. },
  161. {
  162. "RENDERED_VERTICE_COUNTER",
  163. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
  164. &pipe_reg_read
  165. },
  166. {
  167. "VTX_BRANCH_INST_COUNTER",
  168. VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
  169. &pipe_reg_read
  170. },
  171. {
  172. "VTX_TEXLD_INST_COUNTER",
  173. VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
  174. &pipe_reg_read
  175. },
  176. {
  177. "PXL_BRANCH_INST_COUNTER",
  178. VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
  179. &pipe_reg_read
  180. },
  181. {
  182. "PXL_TEXLD_INST_COUNTER",
  183. VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
  184. &pipe_reg_read
  185. }
  186. }
  187. },
  188. {
  189. .name = "PA",
  190. .profile_read = VIVS_MC_PROFILE_PA_READ,
  191. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  192. .nr_signals = 6,
  193. .signal = (const struct etnaviv_pm_signal[]) {
  194. {
  195. "INPUT_VTX_COUNTER",
  196. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
  197. &perf_reg_read
  198. },
  199. {
  200. "INPUT_PRIM_COUNTER",
  201. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
  202. &perf_reg_read
  203. },
  204. {
  205. "OUTPUT_PRIM_COUNTER",
  206. VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
  207. &perf_reg_read
  208. },
  209. {
  210. "DEPTH_CLIPPED_COUNTER",
  211. VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
  212. &pipe_reg_read
  213. },
  214. {
  215. "TRIVIAL_REJECTED_COUNTER",
  216. VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
  217. &pipe_reg_read
  218. },
  219. {
  220. "CULLED_COUNTER",
  221. VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
  222. &pipe_reg_read
  223. }
  224. }
  225. },
  226. {
  227. .name = "SE",
  228. .profile_read = VIVS_MC_PROFILE_SE_READ,
  229. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  230. .nr_signals = 2,
  231. .signal = (const struct etnaviv_pm_signal[]) {
  232. {
  233. "CULLED_TRIANGLE_COUNT",
  234. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
  235. &perf_reg_read
  236. },
  237. {
  238. "CULLED_LINES_COUNT",
  239. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
  240. &perf_reg_read
  241. }
  242. }
  243. },
  244. {
  245. .name = "RA",
  246. .profile_read = VIVS_MC_PROFILE_RA_READ,
  247. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  248. .nr_signals = 7,
  249. .signal = (const struct etnaviv_pm_signal[]) {
  250. {
  251. "VALID_PIXEL_COUNT",
  252. VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
  253. &perf_reg_read
  254. },
  255. {
  256. "TOTAL_QUAD_COUNT",
  257. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
  258. &perf_reg_read
  259. },
  260. {
  261. "VALID_QUAD_COUNT_AFTER_EARLY_Z",
  262. VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
  263. &perf_reg_read
  264. },
  265. {
  266. "TOTAL_PRIMITIVE_COUNT",
  267. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
  268. &perf_reg_read
  269. },
  270. {
  271. "PIPE_CACHE_MISS_COUNTER",
  272. VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
  273. &perf_reg_read
  274. },
  275. {
  276. "PREFETCH_CACHE_MISS_COUNTER",
  277. VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
  278. &perf_reg_read
  279. },
  280. {
  281. "CULLED_QUAD_COUNT",
  282. VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
  283. &perf_reg_read
  284. }
  285. }
  286. },
  287. {
  288. .name = "TX",
  289. .profile_read = VIVS_MC_PROFILE_TX_READ,
  290. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  291. .nr_signals = 9,
  292. .signal = (const struct etnaviv_pm_signal[]) {
  293. {
  294. "TOTAL_BILINEAR_REQUESTS",
  295. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
  296. &perf_reg_read
  297. },
  298. {
  299. "TOTAL_TRILINEAR_REQUESTS",
  300. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
  301. &perf_reg_read
  302. },
  303. {
  304. "TOTAL_DISCARDED_TEXTURE_REQUESTS",
  305. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
  306. &perf_reg_read
  307. },
  308. {
  309. "TOTAL_TEXTURE_REQUESTS",
  310. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
  311. &perf_reg_read
  312. },
  313. {
  314. "MEM_READ_COUNT",
  315. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
  316. &perf_reg_read
  317. },
  318. {
  319. "MEM_READ_IN_8B_COUNT",
  320. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
  321. &perf_reg_read
  322. },
  323. {
  324. "CACHE_MISS_COUNT",
  325. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
  326. &perf_reg_read
  327. },
  328. {
  329. "CACHE_HIT_TEXEL_COUNT",
  330. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
  331. &perf_reg_read
  332. },
  333. {
  334. "CACHE_MISS_TEXEL_COUNT",
  335. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
  336. &perf_reg_read
  337. }
  338. }
  339. },
  340. {
  341. .name = "MC",
  342. .profile_read = VIVS_MC_PROFILE_MC_READ,
  343. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  344. .nr_signals = 3,
  345. .signal = (const struct etnaviv_pm_signal[]) {
  346. {
  347. "TOTAL_READ_REQ_8B_FROM_PIPELINE",
  348. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
  349. &perf_reg_read
  350. },
  351. {
  352. "TOTAL_READ_REQ_8B_FROM_IP",
  353. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
  354. &perf_reg_read
  355. },
  356. {
  357. "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
  358. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
  359. &perf_reg_read
  360. }
  361. }
  362. }
  363. };
  364. static const struct etnaviv_pm_domain doms_2d[] = {
  365. {
  366. .name = "PE",
  367. .profile_read = VIVS_MC_PROFILE_PE_READ,
  368. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  369. .nr_signals = 1,
  370. .signal = (const struct etnaviv_pm_signal[]) {
  371. {
  372. "PIXELS_RENDERED_2D",
  373. VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
  374. &pipe_reg_read
  375. }
  376. }
  377. }
  378. };
  379. static const struct etnaviv_pm_domain doms_vg[] = {
  380. };
  381. static const struct etnaviv_pm_domain_meta doms_meta[] = {
  382. {
  383. .nr_domains = ARRAY_SIZE(doms_3d),
  384. .domains = &doms_3d[0]
  385. },
  386. {
  387. .nr_domains = ARRAY_SIZE(doms_2d),
  388. .domains = &doms_2d[0]
  389. },
  390. {
  391. .nr_domains = ARRAY_SIZE(doms_vg),
  392. .domains = &doms_vg[0]
  393. }
  394. };
  395. int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
  396. struct drm_etnaviv_pm_domain *domain)
  397. {
  398. const struct etnaviv_pm_domain_meta *meta = &doms_meta[domain->pipe];
  399. const struct etnaviv_pm_domain *dom;
  400. if (domain->iter >= meta->nr_domains)
  401. return -EINVAL;
  402. dom = meta->domains + domain->iter;
  403. domain->id = domain->iter;
  404. domain->nr_signals = dom->nr_signals;
  405. strncpy(domain->name, dom->name, sizeof(domain->name));
  406. domain->iter++;
  407. if (domain->iter == meta->nr_domains)
  408. domain->iter = 0xff;
  409. return 0;
  410. }
  411. int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
  412. struct drm_etnaviv_pm_signal *signal)
  413. {
  414. const struct etnaviv_pm_domain_meta *meta = &doms_meta[signal->pipe];
  415. const struct etnaviv_pm_domain *dom;
  416. const struct etnaviv_pm_signal *sig;
  417. if (signal->domain >= meta->nr_domains)
  418. return -EINVAL;
  419. dom = meta->domains + signal->domain;
  420. if (signal->iter > dom->nr_signals)
  421. return -EINVAL;
  422. sig = &dom->signal[signal->iter];
  423. signal->id = signal->iter;
  424. strncpy(signal->name, sig->name, sizeof(signal->name));
  425. signal->iter++;
  426. if (signal->iter == dom->nr_signals)
  427. signal->iter = 0xffff;
  428. return 0;
  429. }
  430. int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
  431. u32 exec_state)
  432. {
  433. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  434. const struct etnaviv_pm_domain *dom;
  435. if (r->domain >= meta->nr_domains)
  436. return -EINVAL;
  437. dom = meta->domains + r->domain;
  438. if (r->signal > dom->nr_signals)
  439. return -EINVAL;
  440. return 0;
  441. }
  442. void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
  443. const struct etnaviv_perfmon_request *pmr, u32 exec_state)
  444. {
  445. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  446. const struct etnaviv_pm_domain *dom;
  447. const struct etnaviv_pm_signal *sig;
  448. u32 *bo = pmr->bo_vma;
  449. u32 val;
  450. dom = meta->domains + pmr->domain;
  451. sig = &dom->signal[pmr->signal];
  452. val = sig->sample(gpu, dom, sig);
  453. *(bo + pmr->offset) = val;
  454. }