1 // SPDX-License-Identifier: GPL-2.0
3 * Copyright (C) 2017 Etnaviv Project
4 * Copyright (C) 2017 Zodiac Inflight Innovations
7 #include "common.xml.h"
8 #include "etnaviv_gpu.h"
9 #include "etnaviv_perfmon.h"
10 #include "state_hi.xml.h"
12 struct etnaviv_pm_domain;
14 struct etnaviv_pm_signal {
18 u32 (*sample)(struct etnaviv_gpu *gpu,
19 const struct etnaviv_pm_domain *domain,
20 const struct etnaviv_pm_signal *signal);
23 struct etnaviv_pm_domain {
26 /* profile register */
31 const struct etnaviv_pm_signal *signal;
34 struct etnaviv_pm_domain_meta {
36 const struct etnaviv_pm_domain *domains;
40 static u32 perf_reg_read(struct etnaviv_gpu *gpu,
41 const struct etnaviv_pm_domain *domain,
42 const struct etnaviv_pm_signal *signal)
44 gpu_write(gpu, domain->profile_config, signal->data);
46 return gpu_read(gpu, domain->profile_read);
49 static inline void pipe_select(struct etnaviv_gpu *gpu, u32 clock, unsigned pipe)
51 clock &= ~(VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE__MASK);
52 clock |= VIVS_HI_CLOCK_CONTROL_DEBUG_PIXEL_PIPE(pipe);
54 gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
57 static u32 pipe_perf_reg_read(struct etnaviv_gpu *gpu,
58 const struct etnaviv_pm_domain *domain,
59 const struct etnaviv_pm_signal *signal)
61 u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
65 lockdep_assert_held(&gpu->lock);
67 for (i = 0; i < gpu->identity.pixel_pipes; i++) {
68 pipe_select(gpu, clock, i);
69 value += perf_reg_read(gpu, domain, signal);
72 /* switch back to pixel pipe 0 to prevent GPU hang */
73 pipe_select(gpu, clock, 0);
78 static u32 pipe_reg_read(struct etnaviv_gpu *gpu,
79 const struct etnaviv_pm_domain *domain,
80 const struct etnaviv_pm_signal *signal)
82 u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
86 lockdep_assert_held(&gpu->lock);
88 for (i = 0; i < gpu->identity.pixel_pipes; i++) {
89 pipe_select(gpu, clock, i);
90 value += gpu_read(gpu, signal->data);
93 /* switch back to pixel pipe 0 to prevent GPU hang */
94 pipe_select(gpu, clock, 0);
99 static u32 hi_total_cycle_read(struct etnaviv_gpu *gpu,
100 const struct etnaviv_pm_domain *domain,
101 const struct etnaviv_pm_signal *signal)
103 u32 reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
105 if (gpu->identity.model == chipModel_GC880 ||
106 gpu->identity.model == chipModel_GC2000 ||
107 gpu->identity.model == chipModel_GC2100)
108 reg = VIVS_MC_PROFILE_CYCLE_COUNTER;
110 return gpu_read(gpu, reg);
113 static u32 hi_total_idle_cycle_read(struct etnaviv_gpu *gpu,
114 const struct etnaviv_pm_domain *domain,
115 const struct etnaviv_pm_signal *signal)
117 u32 reg = VIVS_HI_PROFILE_IDLE_CYCLES;
119 if (gpu->identity.model == chipModel_GC880 ||
120 gpu->identity.model == chipModel_GC2000 ||
121 gpu->identity.model == chipModel_GC2100)
122 reg = VIVS_HI_PROFILE_TOTAL_CYCLES;
124 return gpu_read(gpu, reg);
127 static const struct etnaviv_pm_domain doms_3d[] = {
130 .profile_read = VIVS_MC_PROFILE_HI_READ,
131 .profile_config = VIVS_MC_PROFILE_CONFIG2,
133 .signal = (const struct etnaviv_pm_signal[]) {
136 VIVS_HI_PROFILE_READ_BYTES8,
140 "TOTAL_WRITE_BYTES8",
141 VIVS_HI_PROFILE_WRITE_BYTES8,
152 &hi_total_idle_cycle_read
155 "AXI_CYCLES_READ_REQUEST_STALLED",
156 VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_READ_REQUEST_STALLED,
160 "AXI_CYCLES_WRITE_REQUEST_STALLED",
161 VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_REQUEST_STALLED,
165 "AXI_CYCLES_WRITE_DATA_STALLED",
166 VIVS_MC_PROFILE_CONFIG2_HI_AXI_CYCLES_WRITE_DATA_STALLED,
173 .profile_read = VIVS_MC_PROFILE_PE_READ,
174 .profile_config = VIVS_MC_PROFILE_CONFIG0,
176 .signal = (const struct etnaviv_pm_signal[]) {
178 "PIXEL_COUNT_KILLED_BY_COLOR_PIPE",
179 VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_COLOR_PIPE,
183 "PIXEL_COUNT_KILLED_BY_DEPTH_PIPE",
184 VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_KILLED_BY_DEPTH_PIPE,
188 "PIXEL_COUNT_DRAWN_BY_COLOR_PIPE",
189 VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_COLOR_PIPE,
193 "PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE",
194 VIVS_MC_PROFILE_CONFIG0_PE_PIXEL_COUNT_DRAWN_BY_DEPTH_PIPE,
201 .profile_read = VIVS_MC_PROFILE_SH_READ,
202 .profile_config = VIVS_MC_PROFILE_CONFIG0,
204 .signal = (const struct etnaviv_pm_signal[]) {
207 VIVS_MC_PROFILE_CONFIG0_SH_SHADER_CYCLES,
212 VIVS_MC_PROFILE_CONFIG0_SH_PS_INST_COUNTER,
216 "RENDERED_PIXEL_COUNTER",
217 VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_PIXEL_COUNTER,
222 VIVS_MC_PROFILE_CONFIG0_SH_VS_INST_COUNTER,
226 "RENDERED_VERTICE_COUNTER",
227 VIVS_MC_PROFILE_CONFIG0_SH_RENDERED_VERTICE_COUNTER,
231 "VTX_BRANCH_INST_COUNTER",
232 VIVS_MC_PROFILE_CONFIG0_SH_VTX_BRANCH_INST_COUNTER,
236 "VTX_TEXLD_INST_COUNTER",
237 VIVS_MC_PROFILE_CONFIG0_SH_VTX_TEXLD_INST_COUNTER,
241 "PXL_BRANCH_INST_COUNTER",
242 VIVS_MC_PROFILE_CONFIG0_SH_PXL_BRANCH_INST_COUNTER,
246 "PXL_TEXLD_INST_COUNTER",
247 VIVS_MC_PROFILE_CONFIG0_SH_PXL_TEXLD_INST_COUNTER,
254 .profile_read = VIVS_MC_PROFILE_PA_READ,
255 .profile_config = VIVS_MC_PROFILE_CONFIG1,
257 .signal = (const struct etnaviv_pm_signal[]) {
260 VIVS_MC_PROFILE_CONFIG1_PA_INPUT_VTX_COUNTER,
264 "INPUT_PRIM_COUNTER",
265 VIVS_MC_PROFILE_CONFIG1_PA_INPUT_PRIM_COUNTER,
269 "OUTPUT_PRIM_COUNTER",
270 VIVS_MC_PROFILE_CONFIG1_PA_OUTPUT_PRIM_COUNTER,
274 "DEPTH_CLIPPED_COUNTER",
275 VIVS_MC_PROFILE_CONFIG1_PA_DEPTH_CLIPPED_COUNTER,
279 "TRIVIAL_REJECTED_COUNTER",
280 VIVS_MC_PROFILE_CONFIG1_PA_TRIVIAL_REJECTED_COUNTER,
285 VIVS_MC_PROFILE_CONFIG1_PA_CULLED_COUNTER,
292 .profile_read = VIVS_MC_PROFILE_SE_READ,
293 .profile_config = VIVS_MC_PROFILE_CONFIG1,
295 .signal = (const struct etnaviv_pm_signal[]) {
297 "CULLED_TRIANGLE_COUNT",
298 VIVS_MC_PROFILE_CONFIG1_SE_CULLED_TRIANGLE_COUNT,
302 "CULLED_LINES_COUNT",
303 VIVS_MC_PROFILE_CONFIG1_SE_CULLED_LINES_COUNT,
310 .profile_read = VIVS_MC_PROFILE_RA_READ,
311 .profile_config = VIVS_MC_PROFILE_CONFIG1,
313 .signal = (const struct etnaviv_pm_signal[]) {
316 VIVS_MC_PROFILE_CONFIG1_RA_VALID_PIXEL_COUNT,
321 VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_QUAD_COUNT,
325 "VALID_QUAD_COUNT_AFTER_EARLY_Z",
326 VIVS_MC_PROFILE_CONFIG1_RA_VALID_QUAD_COUNT_AFTER_EARLY_Z,
330 "TOTAL_PRIMITIVE_COUNT",
331 VIVS_MC_PROFILE_CONFIG1_RA_TOTAL_PRIMITIVE_COUNT,
335 "PIPE_CACHE_MISS_COUNTER",
336 VIVS_MC_PROFILE_CONFIG1_RA_PIPE_CACHE_MISS_COUNTER,
340 "PREFETCH_CACHE_MISS_COUNTER",
341 VIVS_MC_PROFILE_CONFIG1_RA_PREFETCH_CACHE_MISS_COUNTER,
346 VIVS_MC_PROFILE_CONFIG1_RA_CULLED_QUAD_COUNT,
353 .profile_read = VIVS_MC_PROFILE_TX_READ,
354 .profile_config = VIVS_MC_PROFILE_CONFIG1,
356 .signal = (const struct etnaviv_pm_signal[]) {
358 "TOTAL_BILINEAR_REQUESTS",
359 VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_BILINEAR_REQUESTS,
363 "TOTAL_TRILINEAR_REQUESTS",
364 VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TRILINEAR_REQUESTS,
368 "TOTAL_DISCARDED_TEXTURE_REQUESTS",
369 VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_DISCARDED_TEXTURE_REQUESTS,
373 "TOTAL_TEXTURE_REQUESTS",
374 VIVS_MC_PROFILE_CONFIG1_TX_TOTAL_TEXTURE_REQUESTS,
379 VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_COUNT,
383 "MEM_READ_IN_8B_COUNT",
384 VIVS_MC_PROFILE_CONFIG1_TX_MEM_READ_IN_8B_COUNT,
389 VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_COUNT,
393 "CACHE_HIT_TEXEL_COUNT",
394 VIVS_MC_PROFILE_CONFIG1_TX_CACHE_HIT_TEXEL_COUNT,
398 "CACHE_MISS_TEXEL_COUNT",
399 VIVS_MC_PROFILE_CONFIG1_TX_CACHE_MISS_TEXEL_COUNT,
406 .profile_read = VIVS_MC_PROFILE_MC_READ,
407 .profile_config = VIVS_MC_PROFILE_CONFIG2,
409 .signal = (const struct etnaviv_pm_signal[]) {
411 "TOTAL_READ_REQ_8B_FROM_PIPELINE",
412 VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_PIPELINE,
416 "TOTAL_READ_REQ_8B_FROM_IP",
417 VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_READ_REQ_8B_FROM_IP,
421 "TOTAL_WRITE_REQ_8B_FROM_PIPELINE",
422 VIVS_MC_PROFILE_CONFIG2_MC_TOTAL_WRITE_REQ_8B_FROM_PIPELINE,
429 static const struct etnaviv_pm_domain doms_2d[] = {
432 .profile_read = VIVS_MC_PROFILE_PE_READ,
433 .profile_config = VIVS_MC_PROFILE_CONFIG0,
435 .signal = (const struct etnaviv_pm_signal[]) {
437 "PIXELS_RENDERED_2D",
438 VIVS_MC_PROFILE_CONFIG0_PE_PIXELS_RENDERED_2D,
445 static const struct etnaviv_pm_domain doms_vg[] = {
448 static const struct etnaviv_pm_domain_meta doms_meta[] = {
450 .feature = chipFeatures_PIPE_3D,
451 .nr_domains = ARRAY_SIZE(doms_3d),
452 .domains = &doms_3d[0]
455 .feature = chipFeatures_PIPE_2D,
456 .nr_domains = ARRAY_SIZE(doms_2d),
457 .domains = &doms_2d[0]
460 .feature = chipFeatures_PIPE_VG,
461 .nr_domains = ARRAY_SIZE(doms_vg),
462 .domains = &doms_vg[0]
466 static unsigned int num_pm_domains(const struct etnaviv_gpu *gpu)
468 unsigned int num = 0, i;
470 for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
471 const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
473 if (gpu->identity.features & meta->feature)
474 num += meta->nr_domains;
480 static const struct etnaviv_pm_domain *pm_domain(const struct etnaviv_gpu *gpu,
483 const struct etnaviv_pm_domain *domain = NULL;
484 unsigned int offset = 0, i;
486 for (i = 0; i < ARRAY_SIZE(doms_meta); i++) {
487 const struct etnaviv_pm_domain_meta *meta = &doms_meta[i];
489 if (!(gpu->identity.features & meta->feature))
492 if (index - offset >= meta->nr_domains) {
493 offset += meta->nr_domains;
497 domain = meta->domains + (index - offset);
503 int etnaviv_pm_query_dom(struct etnaviv_gpu *gpu,
504 struct drm_etnaviv_pm_domain *domain)
506 const unsigned int nr_domains = num_pm_domains(gpu);
507 const struct etnaviv_pm_domain *dom;
509 if (domain->iter >= nr_domains)
512 dom = pm_domain(gpu, domain->iter);
516 domain->id = domain->iter;
517 domain->nr_signals = dom->nr_signals;
518 strscpy_pad(domain->name, dom->name, sizeof(domain->name));
521 if (domain->iter == nr_domains)
527 int etnaviv_pm_query_sig(struct etnaviv_gpu *gpu,
528 struct drm_etnaviv_pm_signal *signal)
530 const unsigned int nr_domains = num_pm_domains(gpu);
531 const struct etnaviv_pm_domain *dom;
532 const struct etnaviv_pm_signal *sig;
534 if (signal->domain >= nr_domains)
537 dom = pm_domain(gpu, signal->domain);
541 if (signal->iter >= dom->nr_signals)
544 sig = &dom->signal[signal->iter];
546 signal->id = signal->iter;
547 strscpy_pad(signal->name, sig->name, sizeof(signal->name));
550 if (signal->iter == dom->nr_signals)
551 signal->iter = 0xffff;
556 int etnaviv_pm_req_validate(const struct drm_etnaviv_gem_submit_pmr *r,
559 const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
560 const struct etnaviv_pm_domain *dom;
562 if (r->domain >= meta->nr_domains)
565 dom = meta->domains + r->domain;
567 if (r->signal >= dom->nr_signals)
573 void etnaviv_perfmon_process(struct etnaviv_gpu *gpu,
574 const struct etnaviv_perfmon_request *pmr, u32 exec_state)
576 const struct etnaviv_pm_domain_meta *meta = &doms_meta[exec_state];
577 const struct etnaviv_pm_domain *dom;
578 const struct etnaviv_pm_signal *sig;
579 u32 *bo = pmr->bo_vma;
582 dom = meta->domains + pmr->domain;
583 sig = &dom->signal[pmr->signal];
584 val = sig->sample(gpu, dom, sig);
586 *(bo + pmr->offset) = val;