etnaviv_perfmon.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (C) 2017 Etnaviv Project
  4. * Copyright (C) 2017 Zodiac Inflight Innovations
  5. */
  6. #include "common.xml.h"
  7. #include "etnaviv_gpu.h"
  8. #include "etnaviv_perfmon.h"
  9. #include "state_hi.xml.h"
  10. struct etnaviv_pm_domain;
  11. struct etnaviv_pm_signal {
  12. char name[64];
  13. u32 data;
  14. u32 (*sample)(struct etnaviv_gpu *gpu,
  15. const struct etnaviv_pm_domain *domain,
  16. const struct etnaviv_pm_signal *signal);
  17. };
  18. struct etnaviv_pm_domain {
  19. char name[64];
  20. /* profile register */
  21. u32 profile_read;
  22. u32 profile_config;
  23. u8 nr_signals;
  24. const struct etnaviv_pm_signal *signal;
  25. };
  26. struct etnaviv_pm_domain_meta {
  27. unsigned int feature;
  28. const struct etnaviv_pm_domain *domains;
  29. u32 nr_domains;
  30. };
  31. static u32 perf_reg_read(struct etnaviv_gpu *gpu,
  32. const struct etnaviv_pm_domain *domain,
  33. const struct etnaviv_pm_signal *signal)
  34. {
  35. gpu_write(gpu, domain->profile_config, signal->data);
  36. return gpu_read(gpu, domain->profile_read);
  37. }
  38. static inline void pipe_select(struct etnaviv_gpu *gpu, u32 clock, unsigned pipe)
  39. {
  40. clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
  41. clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(pipe);
  42. gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
  43. }
  44. static u32 pipe_perf_reg_read(struct etnaviv_gpu *gpu,
  45. const struct etnaviv_pm_domain *domain,
  46. const struct etnaviv_pm_signal *signal)
  47. {
  48. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  49. u32 value = 0;
  50. unsigned i;
  51. lockdep_assert_held(&gpu->lock);
  52. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  53. pipe_select(gpu, clock, i);
  54. value += perf_reg_read(gpu, domain, signal);
  55. }
  56. /* switch back to pixel pipe 0 to prevent GPU hang */
  57. pipe_select(gpu, clock, 0);
  58. return value;
  59. }
  60. static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
  61. const struct etnaviv_pm_domain *domain,
  62. const struct etnaviv_pm_signal *signal)
  63. {
  64. u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
  65. u32 value = 0;
  66. unsigned i;
  67. lockdep_assert_held(&gpu->lock);
  68. for (i = 0; i < gpu->identity.pixel_pipes; i++) {
  69. pipe_select(gpu, clock, i);
  70. value += gpu_read(gpu, signal->data);
  71. }
  72. /* switch back to pixel pipe 0 to prevent GPU hang */
  73. pipe_select(gpu, clock, 0);
  74. return value;
  75. }
  76. static u32 hi_total_cycle_read(struct etnaviv_gpu *gpu,
  77. const struct etnaviv_pm_domain *domain,
  78. const struct etnaviv_pm_signal *signal)
  79. {
  80. u32 reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  81. if (gpu->identity.model == chipModel_GC880 ||
  82. gpu->identity.model == chipModel_GC2000 ||
  83. gpu->identity.model == chipModel_GC2100)
  84. reg = VIVS_MC_PROFILE_CYCLE_COUNTER;
  85. return gpu_read(gpu, reg);
  86. }
  87. static u32 hi_total_idle_cycle_read(struct etnaviv_gpu *gpu,
  88. const struct etnaviv_pm_domain *domain,
  89. const struct etnaviv_pm_signal *signal)
  90. {
  91. u32 reg = VIVS_HI_PROFILE_IDLE_CYCLES;
  92. if (gpu->identity.model == chipModel_GC880 ||
  93. gpu->identity.model == chipModel_GC2000 ||
  94. gpu->identity.model == chipModel_GC2100)
  95. reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
  96. return gpu_read(gpu, reg);
  97. }
  98. static const struct etnaviv_pm_domain doms_3d[] = {
  99. {
  100. .name = "HI",
  101. .profile_read = VIVS_MC_PROFILE_HI_READ,
  102. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  103. .nr_signals = 7,
  104. .signal = (const struct etnaviv_pm_signal[]) {
  105. {
  106. "TOTAL_READ_BYTES8",
  107. VIVS_HI_PROFILE_READ_BYTES8,
  108. &pipe_reg_read,
  109. },
  110. {
  111. "TOTAL_WRITE_BYTES8",
  112. VIVS_HI_PROFILE_WRITE_BYTES8,
  113. &pipe_reg_read,
  114. },
  115. {
  116. "TOTAL_CYCLES",
  117. 0,
  118. &hi_total_cycle_read
  119. },
  120. {
  121. "IDLE_CYCLES",
  122. 0,
  123. &hi_total_idle_cycle_read
  124. },
  125. {
  126. "AXI_CYCLES_READ_REQUEST_STALLED",
  127. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
  128. &perf_reg_read
  129. },
  130. {
  131. "AXI_CYCLES_WRITE_REQUEST_STALLED",
  132. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
  133. &perf_reg_read
  134. },
  135. {
  136. "AXI_CYCLES_WRITE_DATA_STALLED",
  137. VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
  138. &perf_reg_read
  139. }
  140. }
  141. },
  142. {
  143. .name = "PE",
  144. .profile_read = VIVS_MC_PROFILE_PE_READ,
  145. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  146. .nr_signals = 4,
  147. .signal = (const struct etnaviv_pm_signal[]) {
  148. {
  149. "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
  150. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
  151. &pipe_perf_reg_read
  152. },
  153. {
  154. "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
  155. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
  156. &pipe_perf_reg_read
  157. },
  158. {
  159. "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
  160. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
  161. &pipe_perf_reg_read
  162. },
  163. {
  164. "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
  165. VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
  166. &pipe_perf_reg_read
  167. }
  168. }
  169. },
  170. {
  171. .name = "SH",
  172. .profile_read = VIVS_MC_PROFILE_SH_READ,
  173. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  174. .nr_signals = 9,
  175. .signal = (const struct etnaviv_pm_signal[]) {
  176. {
  177. "SHADER_CYCLES",
  178. VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
  179. &perf_reg_read
  180. },
  181. {
  182. "PS_INST_COUNTER",
  183. VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
  184. &perf_reg_read
  185. },
  186. {
  187. "RENDERED_PIXEL_COUNTER",
  188. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
  189. &perf_reg_read
  190. },
  191. {
  192. "VS_INST_COUNTER",
  193. VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
  194. &pipe_perf_reg_read
  195. },
  196. {
  197. "RENDERED_VERTICE_COUNTER",
  198. VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
  199. &pipe_perf_reg_read
  200. },
  201. {
  202. "VTX_BRANCH_INST_COUNTER",
  203. VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
  204. &pipe_perf_reg_read
  205. },
  206. {
  207. "VTX_TEXLD_INST_COUNTER",
  208. VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
  209. &pipe_perf_reg_read
  210. },
  211. {
  212. "PXL_BRANCH_INST_COUNTER",
  213. VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
  214. &pipe_perf_reg_read
  215. },
  216. {
  217. "PXL_TEXLD_INST_COUNTER",
  218. VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
  219. &pipe_perf_reg_read
  220. }
  221. }
  222. },
  223. {
  224. .name = "PA",
  225. .profile_read = VIVS_MC_PROFILE_PA_READ,
  226. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  227. .nr_signals = 6,
  228. .signal = (const struct etnaviv_pm_signal[]) {
  229. {
  230. "INPUT_VTX_COUNTER",
  231. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
  232. &perf_reg_read
  233. },
  234. {
  235. "INPUT_PRIM_COUNTER",
  236. VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
  237. &perf_reg_read
  238. },
  239. {
  240. "OUTPUT_PRIM_COUNTER",
  241. VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
  242. &perf_reg_read
  243. },
  244. {
  245. "DEPTH_CLIPPED_COUNTER",
  246. VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
  247. &pipe_perf_reg_read
  248. },
  249. {
  250. "TRIVIAL_REJECTED_COUNTER",
  251. VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
  252. &pipe_perf_reg_read
  253. },
  254. {
  255. "CULLED_COUNTER",
  256. VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
  257. &pipe_perf_reg_read
  258. }
  259. }
  260. },
  261. {
  262. .name = "SE",
  263. .profile_read = VIVS_MC_PROFILE_SE_READ,
  264. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  265. .nr_signals = 2,
  266. .signal = (const struct etnaviv_pm_signal[]) {
  267. {
  268. "CULLED_TRIANGLE_COUNT",
  269. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
  270. &perf_reg_read
  271. },
  272. {
  273. "CULLED_LINES_COUNT",
  274. VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
  275. &perf_reg_read
  276. }
  277. }
  278. },
  279. {
  280. .name = "RA",
  281. .profile_read = VIVS_MC_PROFILE_RA_READ,
  282. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  283. .nr_signals = 7,
  284. .signal = (const struct etnaviv_pm_signal[]) {
  285. {
  286. "VALID_PIXEL_COUNT",
  287. VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
  288. &perf_reg_read
  289. },
  290. {
  291. "TOTAL_QUAD_COUNT",
  292. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
  293. &perf_reg_read
  294. },
  295. {
  296. "VALID_QUAD_COUNT_AFTER_EARLY_Z",
  297. VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
  298. &perf_reg_read
  299. },
  300. {
  301. "TOTAL_PRIMITIVE_COUNT",
  302. VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
  303. &perf_reg_read
  304. },
  305. {
  306. "PIPE_CACHE_MISS_COUNTER",
  307. VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
  308. &perf_reg_read
  309. },
  310. {
  311. "PREFETCH_CACHE_MISS_COUNTER",
  312. VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
  313. &perf_reg_read
  314. },
  315. {
  316. "CULLED_QUAD_COUNT",
  317. VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
  318. &perf_reg_read
  319. }
  320. }
  321. },
  322. {
  323. .name = "TX",
  324. .profile_read = VIVS_MC_PROFILE_TX_READ,
  325. .profile_config = VIVS_MC_PROFILE_CONFIG1,
  326. .nr_signals = 9,
  327. .signal = (const struct etnaviv_pm_signal[]) {
  328. {
  329. "TOTAL_BILINEAR_REQUESTS",
  330. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
  331. &perf_reg_read
  332. },
  333. {
  334. "TOTAL_TRILINEAR_REQUESTS",
  335. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
  336. &perf_reg_read
  337. },
  338. {
  339. "TOTAL_DISCARDED_TEXTURE_REQUESTS",
  340. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
  341. &perf_reg_read
  342. },
  343. {
  344. "TOTAL_TEXTURE_REQUESTS",
  345. VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
  346. &perf_reg_read
  347. },
  348. {
  349. "MEM_READ_COUNT",
  350. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
  351. &perf_reg_read
  352. },
  353. {
  354. "MEM_READ_IN_8B_COUNT",
  355. VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
  356. &perf_reg_read
  357. },
  358. {
  359. "CACHE_MISS_COUNT",
  360. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
  361. &perf_reg_read
  362. },
  363. {
  364. "CACHE_HIT_TEXEL_COUNT",
  365. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
  366. &perf_reg_read
  367. },
  368. {
  369. "CACHE_MISS_TEXEL_COUNT",
  370. VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
  371. &perf_reg_read
  372. }
  373. }
  374. },
  375. {
  376. .name = "MC",
  377. .profile_read = VIVS_MC_PROFILE_MC_READ,
  378. .profile_config = VIVS_MC_PROFILE_CONFIG2,
  379. .nr_signals = 3,
  380. .signal = (const struct etnaviv_pm_signal[]) {
  381. {
  382. "TOTAL_READ_REQ_8B_FROM_PIPELINE",
  383. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
  384. &perf_reg_read
  385. },
  386. {
  387. "TOTAL_READ_REQ_8B_FROM_IP",
  388. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
  389. &perf_reg_read
  390. },
  391. {
  392. "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
  393. VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
  394. &perf_reg_read
  395. }
  396. }
  397. }
  398. };
  399. static const struct etnaviv_pm_domain doms_2d[] = {
  400. {
  401. .name = "PE",
  402. .profile_read = VIVS_MC_PROFILE_PE_READ,
  403. .profile_config = VIVS_MC_PROFILE_CONFIG0,
  404. .nr_signals = 1,
  405. .signal = (const struct etnaviv_pm_signal[]) {
  406. {
  407. "PIXELS_RENDERED_2D",
  408. VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
  409. &pipe_perf_reg_read
  410. }
  411. }
  412. }
  413. };
  414. static const struct etnaviv_pm_domain doms_vg[] = {
  415. };
  416. static const struct etnaviv_pm_domain_meta doms_meta[] = {
  417. {
  418. .feature = chipFeatures_PIPE_3D,
  419. .nr_domains = ARRAY_SIZE(doms_3d),
  420. .domains = &doms_3d[0]
  421. },
  422. {
  423. .feature = chipFeatures_PIPE_2D,
  424. .nr_domains = ARRAY_SIZE(doms_2d),
  425. .domains = &doms_2d[0]
  426. },
  427. {
  428. .feature = chipFeatures_PIPE_VG,
  429. .nr_domains = ARRAY_SIZE(doms_vg),
  430. .domains = &doms_vg[0]
  431. }
  432. };
  433. static unsigned int num_pm_domains(const struct etnaviv_gpu *gpu)
  434. {
  435. unsigned int num = 0, i;
  436. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  437. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  438. if (gpu->identity.features & meta->feature)
  439. num += meta->nr_domains;
  440. }
  441. return num;
  442. }
  443. static const struct etnaviv_pm_domain *pm_domain(const struct etnaviv_gpu *gpu,
  444. unsigned int index)
  445. {
  446. const struct etnaviv_pm_domain *domain = NULL;
  447. unsigned int offset = 0, i;
  448. for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
  449. const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
  450. if (!(gpu->identity.features & meta->feature))
  451. continue;
  452. if (index - offset >= meta->nr_domains) {
  453. offset += meta->nr_domains;
  454. continue;
  455. }
  456. domain = meta->domains + (index - offset);
  457. }
  458. return domain;
  459. }
  460. int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
  461. struct drm_etnaviv_pm_domain *domain)
  462. {
  463. const unsigned int nr_domains = num_pm_domains(gpu);
  464. const struct etnaviv_pm_domain *dom;
  465. if (domain->iter >= nr_domains)
  466. return -EINVAL;
  467. dom = pm_domain(gpu, domain->iter);
  468. if (!dom)
  469. return -EINVAL;
  470. domain->id = domain->iter;
  471. domain->nr_signals = dom->nr_signals;
  472. strscpy_pad(domain->name, dom->name, sizeof(domain->name));
  473. domain->iter++;
  474. if (domain->iter == nr_domains)
  475. domain->iter = 0xff;
  476. return 0;
  477. }
  478. int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
  479. struct drm_etnaviv_pm_signal *signal)
  480. {
  481. const unsigned int nr_domains = num_pm_domains(gpu);
  482. const struct etnaviv_pm_domain *dom;
  483. const struct etnaviv_pm_signal *sig;
  484. if (signal->domain >= nr_domains)
  485. return -EINVAL;
  486. dom = pm_domain(gpu, signal->domain);
  487. if (!dom)
  488. return -EINVAL;
  489. if (signal->iter >= dom->nr_signals)
  490. return -EINVAL;
  491. sig = &dom->signal[signal->iter];
  492. signal->id = signal->iter;
  493. strscpy_pad(signal->name, sig->name, sizeof(signal->name));
  494. signal->iter++;
  495. if (signal->iter == dom->nr_signals)
  496. signal->iter = 0xffff;
  497. return 0;
  498. }
  499. int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
  500. u32 exec_state)
  501. {
  502. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  503. const struct etnaviv_pm_domain *dom;
  504. if (r->domain >= meta->nr_domains)
  505. return -EINVAL;
  506. dom = meta->domains + r->domain;
  507. if (r->signal >= dom->nr_signals)
  508. return -EINVAL;
  509. return 0;
  510. }
  511. void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
  512. const struct etnaviv_perfmon_request *pmr, u32 exec_state)
  513. {
  514. const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
  515. const struct etnaviv_pm_domain *dom;
  516. const struct etnaviv_pm_signal *sig;
  517. u32 *bo = pmr->bo_vma;
  518. u32 val;
  519. dom = meta->domains + pmr->domain;
  520. sig = &dom->signal[pmr->signal];
  521. val = sig->sample(gpu, dom, sig);
  522. *(bo + pmr->offset) = val;
  523. }