etnaviv_perfmon.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (C) 2017 Etnaviv Project
  4. * Copyright (C) 2017 Zodiac Inflight Innovations
  5. */
  6. #include "common.xml.h"
  7. #include "etnaviv_gpu.h"
  8. #include "etnaviv_perfmon.h"
  9. #include "state_hi.xml.h"
  10. struct etnaviv_pm_domain;
  11. struct etnaviv_pm_signal {
  12. char name[64];
  13. u32 data;
  14. u32 (*sample)(struct etnaviv_gpu *gpu,
  15. const struct etnaviv_pm_domain *domain,
  16. const struct etnaviv_pm_signal *signal);
  17. };
  18. struct etnaviv_pm_domain {
  19. char name[64];
  20. /* profile register */
  21. u32 profile_read;
  22. u32 profile_config;
  23. u8 nr_signals;
  24. const struct etnaviv_pm_signal *signal;
  25. };
  26. struct etnaviv_pm_domain_meta {
  27. unsigned int feature;
  28. const struct etnaviv_pm_domain *domains;
  29. u32 nr_domains;
  30. };
  31. static u32 perf_reg_read(struct etnaviv_gpu *gpu,
  32. const struct etnaviv_pm_domain *domain,
  33. const struct etnaviv_pm_signal *signal)
  34. {
  35. gpu_write(gpu, domain->profile_config, signal->data);
  36. return gpu_read(gpu, domain->profile_read);
  37. }
  38. static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
  39. const struct etnaviv_pm_domain *domain,
  40. const struct etnaviv_pm_signal *signal)
  41. {
  42. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  43. u32 value = 0;
  44. unsigned i;
  45. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  46. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  47. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(i);
  48. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  49. gpu_write(gpu, domain->profile_config, signal->data);
  50. value += gpu_read(gpu, domain->profile_read);
  51. }
  52. /* switch back to pixel pipe 0 to prevent GPU hang */
  53. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  54. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(0);
  55. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  56. return value;
  57. }
  58. static u32 hi_total_cycle_read(struct etnaviv_gpu *gpu,
  59. const struct etnaviv_pm_domain *domain,
  60. const struct etnaviv_pm_signal *signal)
  61. {
  62. u32 reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  63. if (gpu->identity.model == chipModel_GC880 ||
  64. gpu->identity.model == chipModel_GC2000 ||
  65. gpu->identity.model == chipModel_GC2100)
  66. reg = VIVS_MC_PROFILE_CYCLE_COUNTER;
  67. return gpu_read(gpu, reg);
  68. }
  69. static u32 hi_total_idle_cycle_read(struct etnaviv_gpu *gpu,
  70. const struct etnaviv_pm_domain *domain,
  71. const struct etnaviv_pm_signal *signal)
  72. {
  73. u32 reg = VIVS_HI_PROFILE_IDLE_CYCLES;
  74. if (gpu->identity.model == chipModel_GC880 ||
  75. gpu->identity.model == chipModel_GC2000 ||
  76. gpu->identity.model == chipModel_GC2100)
  77. reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  78. return gpu_read(gpu, reg);
  79. }
  80. static const struct etnaviv_pm_domain doms_3d[] = {
  81. {
  82. .name = "HI",
  83. .profile_read = VIVS_MC_PROFILE_HI_READ,
  84. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  85. .nr_signals = 5,
  86. .signal = (const struct etnaviv_pm_signal[]) {
  87. {
  88. "TOTAL_CYCLES",
  89. 0,
  90. &hi_total_cycle_read
  91. },
  92. {
  93. "IDLE_CYCLES",
  94. 0,
  95. &hi_total_idle_cycle_read
  96. },
  97. {
  98. "AXI_CYCLES_READ_REQUEST_STALLED",
  99. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
  100. &perf_reg_read
  101. },
  102. {
  103. "AXI_CYCLES_WRITE_REQUEST_STALLED",
  104. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
  105. &perf_reg_read
  106. },
  107. {
  108. "AXI_CYCLES_WRITE_DATA_STALLED",
  109. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
  110. &perf_reg_read
  111. }
  112. }
  113. },
  114. {
  115. .name = "PE",
  116. .profile_read = VIVS_MC_PROFILE_PE_READ,
  117. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  118. .nr_signals = 4,
  119. .signal = (const struct etnaviv_pm_signal[]) {
  120. {
  121. "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
  122. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
  123. &pipe_reg_read
  124. },
  125. {
  126. "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
  127. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
  128. &pipe_reg_read
  129. },
  130. {
  131. "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
  132. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
  133. &pipe_reg_read
  134. },
  135. {
  136. "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
  137. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
  138. &pipe_reg_read
  139. }
  140. }
  141. },
  142. {
  143. .name = "SH",
  144. .profile_read = VIVS_MC_PROFILE_SH_READ,
  145. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  146. .nr_signals = 9,
  147. .signal = (const struct etnaviv_pm_signal[]) {
  148. {
  149. "SHADER_CYCLES",
  150. VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
  151. &perf_reg_read
  152. },
  153. {
  154. "PS_INST_COUNTER",
  155. VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
  156. &perf_reg_read
  157. },
  158. {
  159. "RENDERED_PIXEL_COUNTER",
  160. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
  161. &perf_reg_read
  162. },
  163. {
  164. "VS_INST_COUNTER",
  165. VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
  166. &pipe_reg_read
  167. },
  168. {
  169. "RENDERED_VERTICE_COUNTER",
  170. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
  171. &pipe_reg_read
  172. },
  173. {
  174. "VTX_BRANCH_INST_COUNTER",
  175. VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
  176. &pipe_reg_read
  177. },
  178. {
  179. "VTX_TEXLD_INST_COUNTER",
  180. VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
  181. &pipe_reg_read
  182. },
  183. {
  184. "PXL_BRANCH_INST_COUNTER",
  185. VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
  186. &pipe_reg_read
  187. },
  188. {
  189. "PXL_TEXLD_INST_COUNTER",
  190. VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
  191. &pipe_reg_read
  192. }
  193. }
  194. },
  195. {
  196. .name = "PA",
  197. .profile_read = VIVS_MC_PROFILE_PA_READ,
  198. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  199. .nr_signals = 6,
  200. .signal = (const struct etnaviv_pm_signal[]) {
  201. {
  202. "INPUT_VTX_COUNTER",
  203. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
  204. &perf_reg_read
  205. },
  206. {
  207. "INPUT_PRIM_COUNTER",
  208. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
  209. &perf_reg_read
  210. },
  211. {
  212. "OUTPUT_PRIM_COUNTER",
  213. VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
  214. &perf_reg_read
  215. },
  216. {
  217. "DEPTH_CLIPPED_COUNTER",
  218. VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
  219. &pipe_reg_read
  220. },
  221. {
  222. "TRIVIAL_REJECTED_COUNTER",
  223. VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
  224. &pipe_reg_read
  225. },
  226. {
  227. "CULLED_COUNTER",
  228. VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
  229. &pipe_reg_read
  230. }
  231. }
  232. },
  233. {
  234. .name = "SE",
  235. .profile_read = VIVS_MC_PROFILE_SE_READ,
  236. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  237. .nr_signals = 2,
  238. .signal = (const struct etnaviv_pm_signal[]) {
  239. {
  240. "CULLED_TRIANGLE_COUNT",
  241. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
  242. &perf_reg_read
  243. },
  244. {
  245. "CULLED_LINES_COUNT",
  246. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
  247. &perf_reg_read
  248. }
  249. }
  250. },
  251. {
  252. .name = "RA",
  253. .profile_read = VIVS_MC_PROFILE_RA_READ,
  254. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  255. .nr_signals = 7,
  256. .signal = (const struct etnaviv_pm_signal[]) {
  257. {
  258. "VALID_PIXEL_COUNT",
  259. VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
  260. &perf_reg_read
  261. },
  262. {
  263. "TOTAL_QUAD_COUNT",
  264. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
  265. &perf_reg_read
  266. },
  267. {
  268. "VALID_QUAD_COUNT_AFTER_EARLY_Z",
  269. VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
  270. &perf_reg_read
  271. },
  272. {
  273. "TOTAL_PRIMITIVE_COUNT",
  274. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
  275. &perf_reg_read
  276. },
  277. {
  278. "PIPE_CACHE_MISS_COUNTER",
  279. VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
  280. &perf_reg_read
  281. },
  282. {
  283. "PREFETCH_CACHE_MISS_COUNTER",
  284. VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
  285. &perf_reg_read
  286. },
  287. {
  288. "CULLED_QUAD_COUNT",
  289. VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
  290. &perf_reg_read
  291. }
  292. }
  293. },
  294. {
  295. .name = "TX",
  296. .profile_read = VIVS_MC_PROFILE_TX_READ,
  297. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  298. .nr_signals = 9,
  299. .signal = (const struct etnaviv_pm_signal[]) {
  300. {
  301. "TOTAL_BILINEAR_REQUESTS",
  302. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
  303. &perf_reg_read
  304. },
  305. {
  306. "TOTAL_TRILINEAR_REQUESTS",
  307. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
  308. &perf_reg_read
  309. },
  310. {
  311. "TOTAL_DISCARDED_TEXTURE_REQUESTS",
  312. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
  313. &perf_reg_read
  314. },
  315. {
  316. "TOTAL_TEXTURE_REQUESTS",
  317. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
  318. &perf_reg_read
  319. },
  320. {
  321. "MEM_READ_COUNT",
  322. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
  323. &perf_reg_read
  324. },
  325. {
  326. "MEM_READ_IN_8B_COUNT",
  327. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
  328. &perf_reg_read
  329. },
  330. {
  331. "CACHE_MISS_COUNT",
  332. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
  333. &perf_reg_read
  334. },
  335. {
  336. "CACHE_HIT_TEXEL_COUNT",
  337. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
  338. &perf_reg_read
  339. },
  340. {
  341. "CACHE_MISS_TEXEL_COUNT",
  342. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
  343. &perf_reg_read
  344. }
  345. }
  346. },
  347. {
  348. .name = "MC",
  349. .profile_read = VIVS_MC_PROFILE_MC_READ,
  350. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  351. .nr_signals = 3,
  352. .signal = (const struct etnaviv_pm_signal[]) {
  353. {
  354. "TOTAL_READ_REQ_8B_FROM_PIPELINE",
  355. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
  356. &perf_reg_read
  357. },
  358. {
  359. "TOTAL_READ_REQ_8B_FROM_IP",
  360. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
  361. &perf_reg_read
  362. },
  363. {
  364. "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
  365. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
  366. &perf_reg_read
  367. }
  368. }
  369. }
  370. };
  371. static const struct etnaviv_pm_domain doms_2d[] = {
  372. {
  373. .name = "PE",
  374. .profile_read = VIVS_MC_PROFILE_PE_READ,
  375. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  376. .nr_signals = 1,
  377. .signal = (const struct etnaviv_pm_signal[]) {
  378. {
  379. "PIXELS_RENDERED_2D",
  380. VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
  381. &pipe_reg_read
  382. }
  383. }
  384. }
  385. };
  386. static const struct etnaviv_pm_domain doms_vg[] = {
  387. };
  388. static const struct etnaviv_pm_domain_meta doms_meta[] = {
  389. {
  390. .feature = chipFeatures_PIPE_3D,
  391. .nr_domains = ARRAY_SIZE(doms_3d),
  392. .domains = &doms_3d[0]
  393. },
  394. {
  395. .feature = chipFeatures_PIPE_2D,
  396. .nr_domains = ARRAY_SIZE(doms_2d),
  397. .domains = &doms_2d[0]
  398. },
  399. {
  400. .feature = chipFeatures_PIPE_VG,
  401. .nr_domains = ARRAY_SIZE(doms_vg),
  402. .domains = &doms_vg[0]
  403. }
  404. };
  405. static unsigned int num_pm_domains(const struct etnaviv_gpu *gpu)
  406. {
  407. unsigned int num = 0, i;
  408. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  409. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  410. if (gpu->identity.features & meta->feature)
  411. num += meta->nr_domains;
  412. }
  413. return num;
  414. }
  415. static const struct etnaviv_pm_domain *pm_domain(const struct etnaviv_gpu *gpu,
  416. unsigned int index)
  417. {
  418. const struct etnaviv_pm_domain *domain = NULL;
  419. unsigned int offset = 0, i;
  420. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  421. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  422. if (!(gpu->identity.features & meta->feature))
  423. continue;
  424. if (index - offset >= meta->nr_domains) {
  425. offset += meta->nr_domains;
  426. continue;
  427. }
  428. domain = meta->domains + (index - offset);
  429. }
  430. return domain;
  431. }
  432. int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
  433. struct drm_etnaviv_pm_domain *domain)
  434. {
  435. const unsigned int nr_domains = num_pm_domains(gpu);
  436. const struct etnaviv_pm_domain *dom;
  437. if (domain->iter >= nr_domains)
  438. return -EINVAL;
  439. dom = pm_domain(gpu, domain->iter);
  440. if (!dom)
  441. return -EINVAL;
  442. domain->id = domain->iter;
  443. domain->nr_signals = dom->nr_signals;
  444. strncpy(domain->name, dom->name, sizeof(domain->name));
  445. domain->iter++;
  446. if (domain->iter == nr_domains)
  447. domain->iter = 0xff;
  448. return 0;
  449. }
  450. int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
  451. struct drm_etnaviv_pm_signal *signal)
  452. {
  453. const unsigned int nr_domains = num_pm_domains(gpu);
  454. const struct etnaviv_pm_domain *dom;
  455. const struct etnaviv_pm_signal *sig;
  456. if (signal->domain >= nr_domains)
  457. return -EINVAL;
  458. dom = pm_domain(gpu, signal->domain);
  459. if (!dom)
  460. return -EINVAL;
  461. if (signal->iter >= dom->nr_signals)
  462. return -EINVAL;
  463. sig = &dom->signal[signal->iter];
  464. signal->id = signal->iter;
  465. strncpy(signal->name, sig->name, sizeof(signal->name));
  466. signal->iter++;
  467. if (signal->iter == dom->nr_signals)
  468. signal->iter = 0xffff;
  469. return 0;
  470. }
  471. int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
  472. u32 exec_state)
  473. {
  474. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  475. const struct etnaviv_pm_domain *dom;
  476. if (r->domain >= meta->nr_domains)
  477. return -EINVAL;
  478. dom = meta->domains + r->domain;
  479. if (r->signal >= dom->nr_signals)
  480. return -EINVAL;
  481. return 0;
  482. }
  483. void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
  484. const struct etnaviv_perfmon_request *pmr, u32 exec_state)
  485. {
  486. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  487. const struct etnaviv_pm_domain *dom;
  488. const struct etnaviv_pm_signal *sig;
  489. u32 *bo = pmr->bo_vma;
  490. u32 val;
  491. dom = meta->domains + pmr->domain;
  492. sig = &dom->signal[pmr->signal];
  493. val = sig->sample(gpu, dom, sig);
  494. *(bo + pmr->offset) = val;
  495. }