xref: /aosp_15_r20/external/mesa3d/src/freedreno/perfcntrs/fd6_perfcntr.c (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1 /*
2  * Copyright © 2019 Rob Clark <[email protected]>
3  * SPDX-License-Identifier: MIT
4  *
5  * Authors:
6  *    Rob Clark <[email protected]>
7  */
8 
9 #ifndef FD6_PERFCNTR_H_
10 #define FD6_PERFCNTR_H_
11 
12 #include "util/half_float.h"
13 #include "util/u_math.h"
14 #include "adreno_common.xml.h"
15 #include "adreno_pm4.xml.h"
16 #include "a6xx.xml.h"
17 
/*
 * REG() prepends the REG_A6XX_ prefix to its argument by token pasting.
 * It is defined ahead of the freedreno_perfcntr.h include that follows.
 * NOTE(review): presumably the COUNTER() macro from that header expands
 * through REG() -- confirm against freedreno_perfcntr.h.
 */
18 #define REG(_x) REG_A6XX_ ## _x
19 #include "freedreno_perfcntr.h"
20 
/*
 * CP counter slots: 13 active entries, indices 1 through 13.  Each entry
 * names a CP_PERFCTR_CP_SEL(n) register, the matching RBBM_PERFCTR_CP(n)
 * register, and that register + 1.  Index 0 is left commented out because
 * it is reserved for the kernel.
 * NOTE(review): the second and third arguments are presumably the low and
 * high words of the counter value -- confirm against COUNTER() in
 * freedreno_perfcntr.h.
 */
21 static const struct fd_perfcntr_counter cp_counters[] = {
22 //RESERVED: for kernel
23 //    COUNTER(CP_PERFCTR_CP_SEL(0),  RBBM_PERFCTR_CP(0),  RBBM_PERFCTR_CP(0)+1),
24       COUNTER(CP_PERFCTR_CP_SEL(1),  RBBM_PERFCTR_CP(1),  RBBM_PERFCTR_CP(1)+1),
25       COUNTER(CP_PERFCTR_CP_SEL(2),  RBBM_PERFCTR_CP(2),  RBBM_PERFCTR_CP(2)+1),
26       COUNTER(CP_PERFCTR_CP_SEL(3),  RBBM_PERFCTR_CP(3),  RBBM_PERFCTR_CP(3)+1),
27       COUNTER(CP_PERFCTR_CP_SEL(4),  RBBM_PERFCTR_CP(4),  RBBM_PERFCTR_CP(4)+1),
28       COUNTER(CP_PERFCTR_CP_SEL(5),  RBBM_PERFCTR_CP(5),  RBBM_PERFCTR_CP(5)+1),
29       COUNTER(CP_PERFCTR_CP_SEL(6),  RBBM_PERFCTR_CP(6),  RBBM_PERFCTR_CP(6)+1),
30       COUNTER(CP_PERFCTR_CP_SEL(7),  RBBM_PERFCTR_CP(7),  RBBM_PERFCTR_CP(7)+1),
31       COUNTER(CP_PERFCTR_CP_SEL(8),  RBBM_PERFCTR_CP(8),  RBBM_PERFCTR_CP(8)+1),
32       COUNTER(CP_PERFCTR_CP_SEL(9),  RBBM_PERFCTR_CP(9),  RBBM_PERFCTR_CP(9)+1),
33       COUNTER(CP_PERFCTR_CP_SEL(10), RBBM_PERFCTR_CP(10), RBBM_PERFCTR_CP(10)+1),
34       COUNTER(CP_PERFCTR_CP_SEL(11), RBBM_PERFCTR_CP(11), RBBM_PERFCTR_CP(11)+1),
35       COUNTER(CP_PERFCTR_CP_SEL(12), RBBM_PERFCTR_CP(12), RBBM_PERFCTR_CP(12)+1),
36       COUNTER(CP_PERFCTR_CP_SEL(13), RBBM_PERFCTR_CP(13), RBBM_PERFCTR_CP(13)+1),
37 };
38 
/*
 * Events listed for the CP group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): entry order presumably matters to code that indexes this
 * table -- confirm before reordering or inserting entries.
 */
39 static const struct fd_perfcntr_countable cp_countables[] = {
40       COUNTABLE(PERF_CP_ALWAYS_COUNT, UINT64, AVERAGE),
41       COUNTABLE(PERF_CP_BUSY_GFX_CORE_IDLE, UINT64, AVERAGE),
42       COUNTABLE(PERF_CP_BUSY_CYCLES, UINT64, AVERAGE),
43       COUNTABLE(PERF_CP_NUM_PREEMPTIONS, UINT64, AVERAGE),
44       COUNTABLE(PERF_CP_PREEMPTION_REACTION_DELAY, UINT64, AVERAGE),
45       COUNTABLE(PERF_CP_PREEMPTION_SWITCH_OUT_TIME, UINT64, AVERAGE),
46       COUNTABLE(PERF_CP_PREEMPTION_SWITCH_IN_TIME, UINT64, AVERAGE),
47       COUNTABLE(PERF_CP_DEAD_DRAWS_IN_BIN_RENDER, UINT64, AVERAGE),
48       COUNTABLE(PERF_CP_PREDICATED_DRAWS_KILLED, UINT64, AVERAGE),
49       COUNTABLE(PERF_CP_MODE_SWITCH, UINT64, AVERAGE),
50       COUNTABLE(PERF_CP_ZPASS_DONE, UINT64, AVERAGE),
51       COUNTABLE(PERF_CP_CONTEXT_DONE, UINT64, AVERAGE),
52       COUNTABLE(PERF_CP_CACHE_FLUSH, UINT64, AVERAGE),
53       COUNTABLE(PERF_CP_LONG_PREEMPTIONS, UINT64, AVERAGE),
54       COUNTABLE(PERF_CP_SQE_I_CACHE_STARVE, UINT64, AVERAGE),
55       COUNTABLE(PERF_CP_SQE_IDLE, UINT64, AVERAGE),
56       COUNTABLE(PERF_CP_SQE_PM4_STARVE_RB_IB, UINT64, AVERAGE),
57       COUNTABLE(PERF_CP_SQE_PM4_STARVE_SDS, UINT64, AVERAGE),
58       COUNTABLE(PERF_CP_SQE_MRB_STARVE, UINT64, AVERAGE),
59       COUNTABLE(PERF_CP_SQE_RRB_STARVE, UINT64, AVERAGE),
60       COUNTABLE(PERF_CP_SQE_VSD_STARVE, UINT64, AVERAGE),
61       COUNTABLE(PERF_CP_VSD_DECODE_STARVE, UINT64, AVERAGE),
62       COUNTABLE(PERF_CP_SQE_PIPE_OUT_STALL, UINT64, AVERAGE),
63       COUNTABLE(PERF_CP_SQE_SYNC_STALL, UINT64, AVERAGE),
64       COUNTABLE(PERF_CP_SQE_PM4_WFI_STALL, UINT64, AVERAGE),
65       COUNTABLE(PERF_CP_SQE_SYS_WFI_STALL, UINT64, AVERAGE),
66       COUNTABLE(PERF_CP_SQE_T4_EXEC, UINT64, AVERAGE),
67       COUNTABLE(PERF_CP_SQE_LOAD_STATE_EXEC, UINT64, AVERAGE),
68       COUNTABLE(PERF_CP_SQE_SAVE_SDS_STATE, UINT64, AVERAGE),
69       COUNTABLE(PERF_CP_SQE_DRAW_EXEC, UINT64, AVERAGE),
70       COUNTABLE(PERF_CP_SQE_CTXT_REG_BUNCH_EXEC, UINT64, AVERAGE),
71       COUNTABLE(PERF_CP_SQE_EXEC_PROFILED, UINT64, AVERAGE),
72       COUNTABLE(PERF_CP_MEMORY_POOL_EMPTY, UINT64, AVERAGE),
73       COUNTABLE(PERF_CP_MEMORY_POOL_SYNC_STALL, UINT64, AVERAGE),
74       COUNTABLE(PERF_CP_MEMORY_POOL_ABOVE_THRESH, UINT64, AVERAGE),
75       COUNTABLE(PERF_CP_AHB_WR_STALL_PRE_DRAWS, UINT64, AVERAGE),
76       COUNTABLE(PERF_CP_AHB_STALL_SQE_GMU, UINT64, AVERAGE),
77       COUNTABLE(PERF_CP_AHB_STALL_SQE_WR_OTHER, UINT64, AVERAGE),
78       COUNTABLE(PERF_CP_AHB_STALL_SQE_RD_OTHER, UINT64, AVERAGE),
79       COUNTABLE(PERF_CP_CLUSTER0_EMPTY, UINT64, AVERAGE),
80       COUNTABLE(PERF_CP_CLUSTER1_EMPTY, UINT64, AVERAGE),
81       COUNTABLE(PERF_CP_CLUSTER2_EMPTY, UINT64, AVERAGE),
82       COUNTABLE(PERF_CP_CLUSTER3_EMPTY, UINT64, AVERAGE),
83       COUNTABLE(PERF_CP_CLUSTER4_EMPTY, UINT64, AVERAGE),
84       COUNTABLE(PERF_CP_CLUSTER5_EMPTY, UINT64, AVERAGE),
85       COUNTABLE(PERF_CP_PM4_DATA, UINT64, AVERAGE),
86       COUNTABLE(PERF_CP_PM4_HEADERS, UINT64, AVERAGE),
87       COUNTABLE(PERF_CP_VBIF_READ_BEATS, UINT64, AVERAGE),
88       COUNTABLE(PERF_CP_VBIF_WRITE_BEATS, UINT64, AVERAGE),
89       COUNTABLE(PERF_CP_SQE_INSTR_COUNTER, UINT64, AVERAGE),
90 };
91 
/*
 * CCU counter slots: 5 entries, indices 0 through 4.  Each entry names an
 * RB_PERFCTR_CCU_SEL(n) register, the matching RBBM_PERFCTR_CCU(n)
 * register, and that register + 1.  Note the select registers carry the RB_
 * prefix while the counter registers carry the RBBM_ prefix.
 */
92 static const struct fd_perfcntr_counter ccu_counters[] = {
93       COUNTER(RB_PERFCTR_CCU_SEL(0), RBBM_PERFCTR_CCU(0), RBBM_PERFCTR_CCU(0)+1),
94       COUNTER(RB_PERFCTR_CCU_SEL(1), RBBM_PERFCTR_CCU(1), RBBM_PERFCTR_CCU(1)+1),
95       COUNTER(RB_PERFCTR_CCU_SEL(2), RBBM_PERFCTR_CCU(2), RBBM_PERFCTR_CCU(2)+1),
96       COUNTER(RB_PERFCTR_CCU_SEL(3), RBBM_PERFCTR_CCU(3), RBBM_PERFCTR_CCU(3)+1),
97       COUNTER(RB_PERFCTR_CCU_SEL(4), RBBM_PERFCTR_CCU(4), RBBM_PERFCTR_CCU(4)+1),
98 };
99 
/*
 * Events listed for the CCU group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * Both the DEPTH_READ_FLAGn and COLOR_READ_FLAGn runs go 0..6 and then 8;
 * no FLAG7 entry is listed.
 * NOTE(review): presumably this mirrors the selector enum in the register
 * headers rather than being an omission -- confirm against a6xx.xml.h.
 */
100 static const struct fd_perfcntr_countable ccu_countables[] = {
101       COUNTABLE(PERF_CCU_BUSY_CYCLES, UINT64, AVERAGE),
102       COUNTABLE(PERF_CCU_STALL_CYCLES_RB_DEPTH_RETURN, UINT64, AVERAGE),
103       COUNTABLE(PERF_CCU_STALL_CYCLES_RB_COLOR_RETURN, UINT64, AVERAGE),
104       COUNTABLE(PERF_CCU_STARVE_CYCLES_FLAG_RETURN, UINT64, AVERAGE),
105       COUNTABLE(PERF_CCU_DEPTH_BLOCKS, UINT64, AVERAGE),
106       COUNTABLE(PERF_CCU_COLOR_BLOCKS, UINT64, AVERAGE),
107       COUNTABLE(PERF_CCU_DEPTH_BLOCK_HIT, UINT64, AVERAGE),
108       COUNTABLE(PERF_CCU_COLOR_BLOCK_HIT, UINT64, AVERAGE),
109       COUNTABLE(PERF_CCU_PARTIAL_BLOCK_READ, UINT64, AVERAGE),
110       COUNTABLE(PERF_CCU_GMEM_READ, UINT64, AVERAGE),
111       COUNTABLE(PERF_CCU_GMEM_WRITE, UINT64, AVERAGE),
112       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG0_COUNT, UINT64, AVERAGE),
113       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG1_COUNT, UINT64, AVERAGE),
114       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG2_COUNT, UINT64, AVERAGE),
115       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG3_COUNT, UINT64, AVERAGE),
116       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG4_COUNT, UINT64, AVERAGE),
117       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG5_COUNT, UINT64, AVERAGE),
118       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG6_COUNT, UINT64, AVERAGE),
119       COUNTABLE(PERF_CCU_DEPTH_READ_FLAG8_COUNT, UINT64, AVERAGE),
120       COUNTABLE(PERF_CCU_COLOR_READ_FLAG0_COUNT, UINT64, AVERAGE),
121       COUNTABLE(PERF_CCU_COLOR_READ_FLAG1_COUNT, UINT64, AVERAGE),
122       COUNTABLE(PERF_CCU_COLOR_READ_FLAG2_COUNT, UINT64, AVERAGE),
123       COUNTABLE(PERF_CCU_COLOR_READ_FLAG3_COUNT, UINT64, AVERAGE),
124       COUNTABLE(PERF_CCU_COLOR_READ_FLAG4_COUNT, UINT64, AVERAGE),
125       COUNTABLE(PERF_CCU_COLOR_READ_FLAG5_COUNT, UINT64, AVERAGE),
126       COUNTABLE(PERF_CCU_COLOR_READ_FLAG6_COUNT, UINT64, AVERAGE),
127       COUNTABLE(PERF_CCU_COLOR_READ_FLAG8_COUNT, UINT64, AVERAGE),
128       COUNTABLE(PERF_CCU_2D_RD_REQ, UINT64, AVERAGE),
129       COUNTABLE(PERF_CCU_2D_WR_REQ, UINT64, AVERAGE),
130 };
131 
/*
 * TSE counter slots: 4 entries, indices 0 through 3.  Each entry names a
 * GRAS_PERFCTR_TSE_SEL(n) register, the matching RBBM_PERFCTR_TSE(n)
 * register, and that register + 1.
 */
132 static const struct fd_perfcntr_counter tse_counters[] = {
133       COUNTER(GRAS_PERFCTR_TSE_SEL(0), RBBM_PERFCTR_TSE(0), RBBM_PERFCTR_TSE(0)+1),
134       COUNTER(GRAS_PERFCTR_TSE_SEL(1), RBBM_PERFCTR_TSE(1), RBBM_PERFCTR_TSE(1)+1),
135       COUNTER(GRAS_PERFCTR_TSE_SEL(2), RBBM_PERFCTR_TSE(2), RBBM_PERFCTR_TSE(2)+1),
136       COUNTER(GRAS_PERFCTR_TSE_SEL(3), RBBM_PERFCTR_TSE(3), RBBM_PERFCTR_TSE(3)+1),
137 };
138 
/*
 * Events listed for the TSE group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): PERF_TSE_TRIVAL_REJ_PRIM is spelled "TRIVAL" here; it is an
 * identifier defined outside this file (presumably in a6xx.xml.h), so the
 * spelling must not be "corrected" locally.
 */
139 static const struct fd_perfcntr_countable tse_countables[] = {
140       COUNTABLE(PERF_TSE_BUSY_CYCLES, UINT64, AVERAGE),
141       COUNTABLE(PERF_TSE_CLIPPING_CYCLES, UINT64, AVERAGE),
142       COUNTABLE(PERF_TSE_STALL_CYCLES_RAS, UINT64, AVERAGE),
143       COUNTABLE(PERF_TSE_STALL_CYCLES_LRZ_BARYPLANE, UINT64, AVERAGE),
144       COUNTABLE(PERF_TSE_STALL_CYCLES_LRZ_ZPLANE, UINT64, AVERAGE),
145       COUNTABLE(PERF_TSE_STARVE_CYCLES_PC, UINT64, AVERAGE),
146       COUNTABLE(PERF_TSE_INPUT_PRIM, UINT64, AVERAGE),
147       COUNTABLE(PERF_TSE_INPUT_NULL_PRIM, UINT64, AVERAGE),
148       COUNTABLE(PERF_TSE_TRIVAL_REJ_PRIM, UINT64, AVERAGE),
149       COUNTABLE(PERF_TSE_CLIPPED_PRIM, UINT64, AVERAGE),
150       COUNTABLE(PERF_TSE_ZERO_AREA_PRIM, UINT64, AVERAGE),
151       COUNTABLE(PERF_TSE_FACENESS_CULLED_PRIM, UINT64, AVERAGE),
152       COUNTABLE(PERF_TSE_ZERO_PIXEL_PRIM, UINT64, AVERAGE),
153       COUNTABLE(PERF_TSE_OUTPUT_NULL_PRIM, UINT64, AVERAGE),
154       COUNTABLE(PERF_TSE_OUTPUT_VISIBLE_PRIM, UINT64, AVERAGE),
155       COUNTABLE(PERF_TSE_CINVOCATION, UINT64, AVERAGE),
156       COUNTABLE(PERF_TSE_CPRIMITIVES, UINT64, AVERAGE),
157       COUNTABLE(PERF_TSE_2D_INPUT_PRIM, UINT64, AVERAGE),
158       COUNTABLE(PERF_TSE_2D_ALIVE_CYCLES, UINT64, AVERAGE),
159       COUNTABLE(PERF_TSE_CLIP_PLANES, UINT64, AVERAGE),
160 };
161 
/*
 * RAS counter slots: 4 entries, indices 0 through 3.  Each entry names a
 * GRAS_PERFCTR_RAS_SEL(n) register, the matching RBBM_PERFCTR_RAS(n)
 * register, and that register + 1.
 */
162 static const struct fd_perfcntr_counter ras_counters[] = {
163       COUNTER(GRAS_PERFCTR_RAS_SEL(0), RBBM_PERFCTR_RAS(0), RBBM_PERFCTR_RAS(0)+1),
164       COUNTER(GRAS_PERFCTR_RAS_SEL(1), RBBM_PERFCTR_RAS(1), RBBM_PERFCTR_RAS(1)+1),
165       COUNTER(GRAS_PERFCTR_RAS_SEL(2), RBBM_PERFCTR_RAS(2), RBBM_PERFCTR_RAS(2)+1),
166       COUNTER(GRAS_PERFCTR_RAS_SEL(3), RBBM_PERFCTR_RAS(3), RBBM_PERFCTR_RAS(3)+1),
167 };
168 
/*
 * Events listed for the RAS group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): PERF_RAS_PRIM_KILLED_INVISILBE is spelled "INVISILBE" here;
 * it is an identifier defined outside this file (presumably in a6xx.xml.h),
 * so the spelling must not be "corrected" locally.
 */
169 static const struct fd_perfcntr_countable ras_countables[] = {
170       COUNTABLE(PERF_RAS_BUSY_CYCLES, UINT64, AVERAGE),
171       COUNTABLE(PERF_RAS_SUPERTILE_ACTIVE_CYCLES, UINT64, AVERAGE),
172       COUNTABLE(PERF_RAS_STALL_CYCLES_LRZ, UINT64, AVERAGE),
173       COUNTABLE(PERF_RAS_STARVE_CYCLES_TSE, UINT64, AVERAGE),
174       COUNTABLE(PERF_RAS_SUPER_TILES, UINT64, AVERAGE),
175       COUNTABLE(PERF_RAS_8X4_TILES, UINT64, AVERAGE),
176       COUNTABLE(PERF_RAS_MASKGEN_ACTIVE, UINT64, AVERAGE),
177       COUNTABLE(PERF_RAS_FULLY_COVERED_SUPER_TILES, UINT64, AVERAGE),
178       COUNTABLE(PERF_RAS_FULLY_COVERED_8X4_TILES, UINT64, AVERAGE),
179       COUNTABLE(PERF_RAS_PRIM_KILLED_INVISILBE, UINT64, AVERAGE),
180       COUNTABLE(PERF_RAS_SUPERTILE_GEN_ACTIVE_CYCLES, UINT64, AVERAGE),
181       COUNTABLE(PERF_RAS_LRZ_INTF_WORKING_CYCLES, UINT64, AVERAGE),
182       COUNTABLE(PERF_RAS_BLOCKS, UINT64, AVERAGE),
183 };
184 
/*
 * LRZ counter slots: 4 entries, indices 0 through 3.  Each entry names a
 * GRAS_PERFCTR_LRZ_SEL(n) register, the matching RBBM_PERFCTR_LRZ(n)
 * register, and that register + 1.
 */
185 static const struct fd_perfcntr_counter lrz_counters[] = {
186       COUNTER(GRAS_PERFCTR_LRZ_SEL(0), RBBM_PERFCTR_LRZ(0), RBBM_PERFCTR_LRZ(0)+1),
187       COUNTER(GRAS_PERFCTR_LRZ_SEL(1), RBBM_PERFCTR_LRZ(1), RBBM_PERFCTR_LRZ(1)+1),
188       COUNTER(GRAS_PERFCTR_LRZ_SEL(2), RBBM_PERFCTR_LRZ(2), RBBM_PERFCTR_LRZ(2)+1),
189       COUNTER(GRAS_PERFCTR_LRZ_SEL(3), RBBM_PERFCTR_LRZ(3), RBBM_PERFCTR_LRZ(3)+1),
190 };
191 
/*
 * Events listed for the LRZ group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): entry order presumably matters to code that indexes this
 * table -- confirm before reordering or inserting entries.
 */
192 static const struct fd_perfcntr_countable lrz_countables[] = {
193       COUNTABLE(PERF_LRZ_BUSY_CYCLES, UINT64, AVERAGE),
194       COUNTABLE(PERF_LRZ_STARVE_CYCLES_RAS, UINT64, AVERAGE),
195       COUNTABLE(PERF_LRZ_STALL_CYCLES_RB, UINT64, AVERAGE),
196       COUNTABLE(PERF_LRZ_STALL_CYCLES_VSC, UINT64, AVERAGE),
197       COUNTABLE(PERF_LRZ_STALL_CYCLES_VPC, UINT64, AVERAGE),
198       COUNTABLE(PERF_LRZ_STALL_CYCLES_FLAG_PREFETCH, UINT64, AVERAGE),
199       COUNTABLE(PERF_LRZ_STALL_CYCLES_UCHE, UINT64, AVERAGE),
200       COUNTABLE(PERF_LRZ_LRZ_READ, UINT64, AVERAGE),
201       COUNTABLE(PERF_LRZ_LRZ_WRITE, UINT64, AVERAGE),
202       COUNTABLE(PERF_LRZ_READ_LATENCY, UINT64, AVERAGE),
203       COUNTABLE(PERF_LRZ_MERGE_CACHE_UPDATING, UINT64, AVERAGE),
204       COUNTABLE(PERF_LRZ_PRIM_KILLED_BY_MASKGEN, UINT64, AVERAGE),
205       COUNTABLE(PERF_LRZ_PRIM_KILLED_BY_LRZ, UINT64, AVERAGE),
206       COUNTABLE(PERF_LRZ_VISIBLE_PRIM_AFTER_LRZ, UINT64, AVERAGE),
207       COUNTABLE(PERF_LRZ_FULL_8X8_TILES, UINT64, AVERAGE),
208       COUNTABLE(PERF_LRZ_PARTIAL_8X8_TILES, UINT64, AVERAGE),
209       COUNTABLE(PERF_LRZ_TILE_KILLED, UINT64, AVERAGE),
210       COUNTABLE(PERF_LRZ_TOTAL_PIXEL, UINT64, AVERAGE),
211       COUNTABLE(PERF_LRZ_VISIBLE_PIXEL_AFTER_LRZ, UINT64, AVERAGE),
212       COUNTABLE(PERF_LRZ_FULLY_COVERED_TILES, UINT64, AVERAGE),
213       COUNTABLE(PERF_LRZ_PARTIAL_COVERED_TILES, UINT64, AVERAGE),
214       COUNTABLE(PERF_LRZ_FEEDBACK_ACCEPT, UINT64, AVERAGE),
215       COUNTABLE(PERF_LRZ_FEEDBACK_DISCARD, UINT64, AVERAGE),
216       COUNTABLE(PERF_LRZ_FEEDBACK_STALL, UINT64, AVERAGE),
217       COUNTABLE(PERF_LRZ_STALL_CYCLES_RB_ZPLANE, UINT64, AVERAGE),
218       COUNTABLE(PERF_LRZ_STALL_CYCLES_RB_BPLANE, UINT64, AVERAGE),
219       COUNTABLE(PERF_LRZ_STALL_CYCLES_VC, UINT64, AVERAGE),
220       COUNTABLE(PERF_LRZ_RAS_MASK_TRANS, UINT64, AVERAGE),
221 };
222 
/*
 * HLSQ counter slots: 6 active entries, indices 0 through 5.  Each entry
 * names an HLSQ_PERFCTR_HLSQ_SEL(n) register, the matching
 * RBBM_PERFCTR_HLSQ(n) register, and that register + 1.  Entries for
 * indices 6 and 7 are kept commented out pending the TODO below.
 */
223 static const struct fd_perfcntr_counter hlsq_counters[] = {
224       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(0), RBBM_PERFCTR_HLSQ(0), RBBM_PERFCTR_HLSQ(0)+1),
225       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(1), RBBM_PERFCTR_HLSQ(1), RBBM_PERFCTR_HLSQ(1)+1),
226       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(2), RBBM_PERFCTR_HLSQ(2), RBBM_PERFCTR_HLSQ(2)+1),
227       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(3), RBBM_PERFCTR_HLSQ(3), RBBM_PERFCTR_HLSQ(3)+1),
228       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(4), RBBM_PERFCTR_HLSQ(4), RBBM_PERFCTR_HLSQ(4)+1),
229       COUNTER(HLSQ_PERFCTR_HLSQ_SEL(5), RBBM_PERFCTR_HLSQ(5), RBBM_PERFCTR_HLSQ(5)+1),
230       // TODO did we lose some HLSQ counters or are they just missing from xml
231       //	COUNTER(HLSQ_PERFCTR_HLSQ_SEL(6), RBBM_PERFCTR_HLSQ(6), RBBM_PERFCTR_HLSQ(6)+1),
232       //	COUNTER(HLSQ_PERFCTR_HLSQ_SEL(7), RBBM_PERFCTR_HLSQ(7), RBBM_PERFCTR_HLSQ(7)+1),
233 };
234 
/*
 * Events listed for the HLSQ group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): entry order presumably matters to code that indexes this
 * table -- confirm before reordering or inserting entries.
 */
235 static const struct fd_perfcntr_countable hlsq_countables[] = {
236       COUNTABLE(PERF_HLSQ_BUSY_CYCLES, UINT64, AVERAGE),
237       COUNTABLE(PERF_HLSQ_STALL_CYCLES_UCHE, UINT64, AVERAGE),
238       COUNTABLE(PERF_HLSQ_STALL_CYCLES_SP_STATE, UINT64, AVERAGE),
239       COUNTABLE(PERF_HLSQ_STALL_CYCLES_SP_FS_STAGE, UINT64, AVERAGE),
240       COUNTABLE(PERF_HLSQ_UCHE_LATENCY_CYCLES, UINT64, AVERAGE),
241       COUNTABLE(PERF_HLSQ_UCHE_LATENCY_COUNT, UINT64, AVERAGE),
242       COUNTABLE(PERF_HLSQ_FS_STAGE_1X_WAVES, UINT64, AVERAGE),
243       COUNTABLE(PERF_HLSQ_FS_STAGE_2X_WAVES, UINT64, AVERAGE),
244       COUNTABLE(PERF_HLSQ_QUADS, UINT64, AVERAGE),
245       COUNTABLE(PERF_HLSQ_CS_INVOCATIONS, UINT64, AVERAGE),
246       COUNTABLE(PERF_HLSQ_COMPUTE_DRAWCALLS, UINT64, AVERAGE),
247       COUNTABLE(PERF_HLSQ_FS_DATA_WAIT_PROGRAMMING, UINT64, AVERAGE),
248       COUNTABLE(PERF_HLSQ_DUAL_FS_PROG_ACTIVE, UINT64, AVERAGE),
249       COUNTABLE(PERF_HLSQ_DUAL_VS_PROG_ACTIVE, UINT64, AVERAGE),
250       COUNTABLE(PERF_HLSQ_FS_BATCH_COUNT_ZERO, UINT64, AVERAGE),
251       COUNTABLE(PERF_HLSQ_VS_BATCH_COUNT_ZERO, UINT64, AVERAGE),
252       COUNTABLE(PERF_HLSQ_WAVE_PENDING_NO_QUAD, UINT64, AVERAGE),
253       COUNTABLE(PERF_HLSQ_WAVE_PENDING_NO_PRIM_BASE, UINT64, AVERAGE),
254       COUNTABLE(PERF_HLSQ_STALL_CYCLES_VPC, UINT64, AVERAGE),
255       COUNTABLE(PERF_HLSQ_PIXELS, UINT64, AVERAGE),
256       COUNTABLE(PERF_HLSQ_DRAW_MODE_SWITCH_VSFS_SYNC, UINT64, AVERAGE),
257 };
258 
/*
 * PC counter slots: 8 entries, indices 0 through 7.  Each entry names a
 * PC_PERFCTR_PC_SEL(n) register, the matching RBBM_PERFCTR_PC(n) register,
 * and that register + 1.
 */
259 static const struct fd_perfcntr_counter pc_counters[] = {
260       COUNTER(PC_PERFCTR_PC_SEL(0), RBBM_PERFCTR_PC(0), RBBM_PERFCTR_PC(0)+1),
261       COUNTER(PC_PERFCTR_PC_SEL(1), RBBM_PERFCTR_PC(1), RBBM_PERFCTR_PC(1)+1),
262       COUNTER(PC_PERFCTR_PC_SEL(2), RBBM_PERFCTR_PC(2), RBBM_PERFCTR_PC(2)+1),
263       COUNTER(PC_PERFCTR_PC_SEL(3), RBBM_PERFCTR_PC(3), RBBM_PERFCTR_PC(3)+1),
264       COUNTER(PC_PERFCTR_PC_SEL(4), RBBM_PERFCTR_PC(4), RBBM_PERFCTR_PC(4)+1),
265       COUNTER(PC_PERFCTR_PC_SEL(5), RBBM_PERFCTR_PC(5), RBBM_PERFCTR_PC(5)+1),
266       COUNTER(PC_PERFCTR_PC_SEL(6), RBBM_PERFCTR_PC(6), RBBM_PERFCTR_PC(6)+1),
267       COUNTER(PC_PERFCTR_PC_SEL(7), RBBM_PERFCTR_PC(7), RBBM_PERFCTR_PC(7)+1),
268 };
269 
/*
 * Events listed for the PC group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * Four PERF_TESS_* events sit inside this list, between
 * PERF_PC_NON_DRAWCALL_GLOBAL_EVENTS and PERF_PC_TSE_TRANSACTION.
 * NOTE(review): presumably the tessellation events share the PC selector
 * space -- confirm against the selector enum in a6xx.xml.h.
 */
270 static const struct fd_perfcntr_countable pc_countables[] = {
271       COUNTABLE(PERF_PC_BUSY_CYCLES, UINT64, AVERAGE),
272       COUNTABLE(PERF_PC_WORKING_CYCLES, UINT64, AVERAGE),
273       COUNTABLE(PERF_PC_STALL_CYCLES_VFD, UINT64, AVERAGE),
274       COUNTABLE(PERF_PC_STALL_CYCLES_TSE, UINT64, AVERAGE),
275       COUNTABLE(PERF_PC_STALL_CYCLES_VPC, UINT64, AVERAGE),
276       COUNTABLE(PERF_PC_STALL_CYCLES_UCHE, UINT64, AVERAGE),
277       COUNTABLE(PERF_PC_STALL_CYCLES_TESS, UINT64, AVERAGE),
278       COUNTABLE(PERF_PC_STALL_CYCLES_TSE_ONLY, UINT64, AVERAGE),
279       COUNTABLE(PERF_PC_STALL_CYCLES_VPC_ONLY, UINT64, AVERAGE),
280       COUNTABLE(PERF_PC_PASS1_TF_STALL_CYCLES, UINT64, AVERAGE),
281       COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_INDEX, UINT64, AVERAGE),
282       COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_TESS_FACTOR, UINT64, AVERAGE),
283       COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_VIZ_STREAM, UINT64, AVERAGE),
284       COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_POSITION, UINT64, AVERAGE),
285       COUNTABLE(PERF_PC_STARVE_CYCLES_DI, UINT64, AVERAGE),
286       COUNTABLE(PERF_PC_VIS_STREAMS_LOADED, UINT64, AVERAGE),
287       COUNTABLE(PERF_PC_INSTANCES, UINT64, AVERAGE),
288       COUNTABLE(PERF_PC_VPC_PRIMITIVES, UINT64, AVERAGE),
289       COUNTABLE(PERF_PC_DEAD_PRIM, UINT64, AVERAGE),
290       COUNTABLE(PERF_PC_LIVE_PRIM, UINT64, AVERAGE),
291       COUNTABLE(PERF_PC_VERTEX_HITS, UINT64, AVERAGE),
292       COUNTABLE(PERF_PC_IA_VERTICES, UINT64, AVERAGE),
293       COUNTABLE(PERF_PC_IA_PRIMITIVES, UINT64, AVERAGE),
294       COUNTABLE(PERF_PC_GS_PRIMITIVES, UINT64, AVERAGE),
295       COUNTABLE(PERF_PC_HS_INVOCATIONS, UINT64, AVERAGE),
296       COUNTABLE(PERF_PC_DS_INVOCATIONS, UINT64, AVERAGE),
297       COUNTABLE(PERF_PC_VS_INVOCATIONS, UINT64, AVERAGE),
298       COUNTABLE(PERF_PC_GS_INVOCATIONS, UINT64, AVERAGE),
299       COUNTABLE(PERF_PC_DS_PRIMITIVES, UINT64, AVERAGE),
300       COUNTABLE(PERF_PC_VPC_POS_DATA_TRANSACTION, UINT64, AVERAGE),
301       COUNTABLE(PERF_PC_3D_DRAWCALLS, UINT64, AVERAGE),
302       COUNTABLE(PERF_PC_2D_DRAWCALLS, UINT64, AVERAGE),
303       COUNTABLE(PERF_PC_NON_DRAWCALL_GLOBAL_EVENTS, UINT64, AVERAGE),
304       COUNTABLE(PERF_TESS_BUSY_CYCLES, UINT64, AVERAGE),
305       COUNTABLE(PERF_TESS_WORKING_CYCLES, UINT64, AVERAGE),
306       COUNTABLE(PERF_TESS_STALL_CYCLES_PC, UINT64, AVERAGE),
307       COUNTABLE(PERF_TESS_STARVE_CYCLES_PC, UINT64, AVERAGE),
308       COUNTABLE(PERF_PC_TSE_TRANSACTION, UINT64, AVERAGE),
309       COUNTABLE(PERF_PC_TSE_VERTEX, UINT64, AVERAGE),
310       COUNTABLE(PERF_PC_TESS_PC_UV_TRANS, UINT64, AVERAGE),
311       COUNTABLE(PERF_PC_TESS_PC_UV_PATCHES, UINT64, AVERAGE),
312       COUNTABLE(PERF_PC_TESS_FACTOR_TRANS, UINT64, AVERAGE),
313 };
314 
/*
 * RB counter slots: 8 entries, indices 0 through 7.  Each entry names an
 * RB_PERFCTR_RB_SEL(n) register, the matching RBBM_PERFCTR_RB(n) register,
 * and that register + 1.
 */
315 static const struct fd_perfcntr_counter rb_counters[] = {
316       COUNTER(RB_PERFCTR_RB_SEL(0), RBBM_PERFCTR_RB(0), RBBM_PERFCTR_RB(0)+1),
317       COUNTER(RB_PERFCTR_RB_SEL(1), RBBM_PERFCTR_RB(1), RBBM_PERFCTR_RB(1)+1),
318       COUNTER(RB_PERFCTR_RB_SEL(2), RBBM_PERFCTR_RB(2), RBBM_PERFCTR_RB(2)+1),
319       COUNTER(RB_PERFCTR_RB_SEL(3), RBBM_PERFCTR_RB(3), RBBM_PERFCTR_RB(3)+1),
320       COUNTER(RB_PERFCTR_RB_SEL(4), RBBM_PERFCTR_RB(4), RBBM_PERFCTR_RB(4)+1),
321       COUNTER(RB_PERFCTR_RB_SEL(5), RBBM_PERFCTR_RB(5), RBBM_PERFCTR_RB(5)+1),
322       COUNTER(RB_PERFCTR_RB_SEL(6), RBBM_PERFCTR_RB(6), RBBM_PERFCTR_RB(6)+1),
323       COUNTER(RB_PERFCTR_RB_SEL(7), RBBM_PERFCTR_RB(7), RBBM_PERFCTR_RB(7)+1),
324 };
325 
/*
 * Events listed for the RB group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): entry order presumably matters to code that indexes this
 * table -- confirm before reordering or inserting entries.
 */
326 static const struct fd_perfcntr_countable rb_countables[] = {
327       COUNTABLE(PERF_RB_BUSY_CYCLES, UINT64, AVERAGE),
328       COUNTABLE(PERF_RB_STALL_CYCLES_HLSQ, UINT64, AVERAGE),
329       COUNTABLE(PERF_RB_STALL_CYCLES_FIFO0_FULL, UINT64, AVERAGE),
330       COUNTABLE(PERF_RB_STALL_CYCLES_FIFO1_FULL, UINT64, AVERAGE),
331       COUNTABLE(PERF_RB_STALL_CYCLES_FIFO2_FULL, UINT64, AVERAGE),
332       COUNTABLE(PERF_RB_STARVE_CYCLES_SP, UINT64, AVERAGE),
333       COUNTABLE(PERF_RB_STARVE_CYCLES_LRZ_TILE, UINT64, AVERAGE),
334       COUNTABLE(PERF_RB_STARVE_CYCLES_CCU, UINT64, AVERAGE),
335       COUNTABLE(PERF_RB_STARVE_CYCLES_Z_PLANE, UINT64, AVERAGE),
336       COUNTABLE(PERF_RB_STARVE_CYCLES_BARY_PLANE, UINT64, AVERAGE),
337       COUNTABLE(PERF_RB_Z_WORKLOAD, UINT64, AVERAGE),
338       COUNTABLE(PERF_RB_HLSQ_ACTIVE, UINT64, AVERAGE),
339       COUNTABLE(PERF_RB_Z_READ, UINT64, AVERAGE),
340       COUNTABLE(PERF_RB_Z_WRITE, UINT64, AVERAGE),
341       COUNTABLE(PERF_RB_C_READ, UINT64, AVERAGE),
342       COUNTABLE(PERF_RB_C_WRITE, UINT64, AVERAGE),
343       COUNTABLE(PERF_RB_TOTAL_PASS, UINT64, AVERAGE),
344       COUNTABLE(PERF_RB_Z_PASS, UINT64, AVERAGE),
345       COUNTABLE(PERF_RB_Z_FAIL, UINT64, AVERAGE),
346       COUNTABLE(PERF_RB_S_FAIL, UINT64, AVERAGE),
347       COUNTABLE(PERF_RB_BLENDED_FXP_COMPONENTS, UINT64, AVERAGE),
348       COUNTABLE(PERF_RB_BLENDED_FP16_COMPONENTS, UINT64, AVERAGE),
349       COUNTABLE(PERF_RB_PS_INVOCATIONS, UINT64, AVERAGE),
350       COUNTABLE(PERF_RB_2D_ALIVE_CYCLES, UINT64, AVERAGE),
351       COUNTABLE(PERF_RB_2D_STALL_CYCLES_A2D, UINT64, AVERAGE),
352       COUNTABLE(PERF_RB_2D_STARVE_CYCLES_SRC, UINT64, AVERAGE),
353       COUNTABLE(PERF_RB_2D_STARVE_CYCLES_SP, UINT64, AVERAGE),
354       COUNTABLE(PERF_RB_2D_STARVE_CYCLES_DST, UINT64, AVERAGE),
355       COUNTABLE(PERF_RB_2D_VALID_PIXELS, UINT64, AVERAGE),
356       COUNTABLE(PERF_RB_3D_PIXELS, UINT64, AVERAGE),
357       COUNTABLE(PERF_RB_BLENDER_WORKING_CYCLES, UINT64, AVERAGE),
358       COUNTABLE(PERF_RB_ZPROC_WORKING_CYCLES, UINT64, AVERAGE),
359       COUNTABLE(PERF_RB_CPROC_WORKING_CYCLES, UINT64, AVERAGE),
360       COUNTABLE(PERF_RB_SAMPLER_WORKING_CYCLES, UINT64, AVERAGE),
361       COUNTABLE(PERF_RB_STALL_CYCLES_CCU_COLOR_READ, UINT64, AVERAGE),
362       COUNTABLE(PERF_RB_STALL_CYCLES_CCU_COLOR_WRITE, UINT64, AVERAGE),
363       COUNTABLE(PERF_RB_STALL_CYCLES_CCU_DEPTH_READ, UINT64, AVERAGE),
364       COUNTABLE(PERF_RB_STALL_CYCLES_CCU_DEPTH_WRITE, UINT64, AVERAGE),
365       COUNTABLE(PERF_RB_STALL_CYCLES_VPC, UINT64, AVERAGE),
366       COUNTABLE(PERF_RB_2D_INPUT_TRANS, UINT64, AVERAGE),
367       COUNTABLE(PERF_RB_2D_OUTPUT_RB_DST_TRANS, UINT64, AVERAGE),
368       COUNTABLE(PERF_RB_2D_OUTPUT_RB_SRC_TRANS, UINT64, AVERAGE),
369       COUNTABLE(PERF_RB_BLENDED_FP32_COMPONENTS, UINT64, AVERAGE),
370       COUNTABLE(PERF_RB_COLOR_PIX_TILES, UINT64, AVERAGE),
371       COUNTABLE(PERF_RB_STALL_CYCLES_CCU, UINT64, AVERAGE),
372       COUNTABLE(PERF_RB_EARLY_Z_ARB3_GRANT, UINT64, AVERAGE),
373       COUNTABLE(PERF_RB_LATE_Z_ARB3_GRANT, UINT64, AVERAGE),
374       COUNTABLE(PERF_RB_EARLY_Z_SKIP_GRANT, UINT64, AVERAGE),
375 };
376 
/*
 * RBBM counter slots: 3 active entries, indices 1 through 3.  Each entry
 * names an RBBM_PERFCTR_RBBM_SEL(n) register, the matching
 * RBBM_PERFCTR_RBBM(n) register, and that register + 1.  Index 0 is left
 * commented out because it is reserved for the kernel.
 * NOTE(review): the table is tagged UNUSED, presumably because no group
 * currently references it -- confirm against the group list in this file.
 */
377 UNUSED static const struct fd_perfcntr_counter rbbm_counters[] = {
378       //RESERVED: for kernel
379       //	COUNTER(RBBM_PERFCTR_RBBM_SEL(0), RBBM_PERFCTR_RBBM(0), RBBM_PERFCTR_RBBM(0)+1),
380       COUNTER(RBBM_PERFCTR_RBBM_SEL(1), RBBM_PERFCTR_RBBM(1), RBBM_PERFCTR_RBBM(1)+1),
381       COUNTER(RBBM_PERFCTR_RBBM_SEL(2), RBBM_PERFCTR_RBBM(2), RBBM_PERFCTR_RBBM(2)+1),
382       COUNTER(RBBM_PERFCTR_RBBM_SEL(3), RBBM_PERFCTR_RBBM(3), RBBM_PERFCTR_RBBM(3)+1),
383 };
384 
/*
 * Events listed for the RBBM group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): the table is tagged UNUSED, presumably because no group
 * currently references it -- confirm against the group list in this file.
 */
385 UNUSED static const struct fd_perfcntr_countable rbbm_countables[] = {
386       COUNTABLE(PERF_RBBM_ALWAYS_COUNT, UINT64, AVERAGE),
387       COUNTABLE(PERF_RBBM_ALWAYS_ON, UINT64, AVERAGE),
388       COUNTABLE(PERF_RBBM_TSE_BUSY, UINT64, AVERAGE),
389       COUNTABLE(PERF_RBBM_RAS_BUSY, UINT64, AVERAGE),
390       COUNTABLE(PERF_RBBM_PC_DCALL_BUSY, UINT64, AVERAGE),
391       COUNTABLE(PERF_RBBM_PC_VSD_BUSY, UINT64, AVERAGE),
392       COUNTABLE(PERF_RBBM_STATUS_MASKED, UINT64, AVERAGE),
393       COUNTABLE(PERF_RBBM_COM_BUSY, UINT64, AVERAGE),
394       COUNTABLE(PERF_RBBM_DCOM_BUSY, UINT64, AVERAGE),
395       COUNTABLE(PERF_RBBM_VBIF_BUSY, UINT64, AVERAGE),
396       COUNTABLE(PERF_RBBM_VSC_BUSY, UINT64, AVERAGE),
397       COUNTABLE(PERF_RBBM_TESS_BUSY, UINT64, AVERAGE),
398       COUNTABLE(PERF_RBBM_UCHE_BUSY, UINT64, AVERAGE),
399       COUNTABLE(PERF_RBBM_HLSQ_BUSY, UINT64, AVERAGE),
400 };
401 
/*
 * SP counter slots: 23 active entries, indices 1 through 23.  Each entry
 * names an SP_PERFCTR_SP_SEL(n) register, the matching RBBM_PERFCTR_SP(n)
 * register, and that register + 1.  Index 0 is left commented out because
 * it is reserved for the kernel.
 */
402 static const struct fd_perfcntr_counter sp_counters[] = {
403       //RESERVED: for kernel
404       //	COUNTER(SP_PERFCTR_SP_SEL(0),  RBBM_PERFCTR_SP(0),  RBBM_PERFCTR_SP(0)+1),
405       COUNTER(SP_PERFCTR_SP_SEL(1),  RBBM_PERFCTR_SP(1),  RBBM_PERFCTR_SP(1)+1),
406       COUNTER(SP_PERFCTR_SP_SEL(2),  RBBM_PERFCTR_SP(2),  RBBM_PERFCTR_SP(2)+1),
407       COUNTER(SP_PERFCTR_SP_SEL(3),  RBBM_PERFCTR_SP(3),  RBBM_PERFCTR_SP(3)+1),
408       COUNTER(SP_PERFCTR_SP_SEL(4),  RBBM_PERFCTR_SP(4),  RBBM_PERFCTR_SP(4)+1),
409       COUNTER(SP_PERFCTR_SP_SEL(5),  RBBM_PERFCTR_SP(5),  RBBM_PERFCTR_SP(5)+1),
410       COUNTER(SP_PERFCTR_SP_SEL(6),  RBBM_PERFCTR_SP(6),  RBBM_PERFCTR_SP(6)+1),
411       COUNTER(SP_PERFCTR_SP_SEL(7),  RBBM_PERFCTR_SP(7),  RBBM_PERFCTR_SP(7)+1),
412       COUNTER(SP_PERFCTR_SP_SEL(8),  RBBM_PERFCTR_SP(8),  RBBM_PERFCTR_SP(8)+1),
413       COUNTER(SP_PERFCTR_SP_SEL(9),  RBBM_PERFCTR_SP(9),  RBBM_PERFCTR_SP(9)+1),
414       COUNTER(SP_PERFCTR_SP_SEL(10), RBBM_PERFCTR_SP(10), RBBM_PERFCTR_SP(10)+1),
415       COUNTER(SP_PERFCTR_SP_SEL(11), RBBM_PERFCTR_SP(11), RBBM_PERFCTR_SP(11)+1),
416       COUNTER(SP_PERFCTR_SP_SEL(12), RBBM_PERFCTR_SP(12), RBBM_PERFCTR_SP(12)+1),
417       COUNTER(SP_PERFCTR_SP_SEL(13), RBBM_PERFCTR_SP(13), RBBM_PERFCTR_SP(13)+1),
418       COUNTER(SP_PERFCTR_SP_SEL(14), RBBM_PERFCTR_SP(14), RBBM_PERFCTR_SP(14)+1),
419       COUNTER(SP_PERFCTR_SP_SEL(15), RBBM_PERFCTR_SP(15), RBBM_PERFCTR_SP(15)+1),
420       COUNTER(SP_PERFCTR_SP_SEL(16), RBBM_PERFCTR_SP(16), RBBM_PERFCTR_SP(16)+1),
421       COUNTER(SP_PERFCTR_SP_SEL(17), RBBM_PERFCTR_SP(17), RBBM_PERFCTR_SP(17)+1),
422       COUNTER(SP_PERFCTR_SP_SEL(18), RBBM_PERFCTR_SP(18), RBBM_PERFCTR_SP(18)+1),
423       COUNTER(SP_PERFCTR_SP_SEL(19), RBBM_PERFCTR_SP(19), RBBM_PERFCTR_SP(19)+1),
424       COUNTER(SP_PERFCTR_SP_SEL(20), RBBM_PERFCTR_SP(20), RBBM_PERFCTR_SP(20)+1),
425       COUNTER(SP_PERFCTR_SP_SEL(21), RBBM_PERFCTR_SP(21), RBBM_PERFCTR_SP(21)+1),
426       COUNTER(SP_PERFCTR_SP_SEL(22), RBBM_PERFCTR_SP(22), RBBM_PERFCTR_SP(22)+1),
427       COUNTER(SP_PERFCTR_SP_SEL(23), RBBM_PERFCTR_SP(23), RBBM_PERFCTR_SP(23)+1),
428 };
429 
/*
 * Events listed for the SP group.  Every entry passes UINT64 and AVERAGE
 * as its second and third COUNTABLE() arguments.
 * NOTE(review): entry order presumably matters to code that indexes this
 * table -- confirm before reordering or inserting entries.
 */
430 static const struct fd_perfcntr_countable sp_countables[] = {
431       COUNTABLE(PERF_SP_BUSY_CYCLES, UINT64, AVERAGE),
432       COUNTABLE(PERF_SP_ALU_WORKING_CYCLES, UINT64, AVERAGE),
433       COUNTABLE(PERF_SP_EFU_WORKING_CYCLES, UINT64, AVERAGE),
434       COUNTABLE(PERF_SP_STALL_CYCLES_VPC, UINT64, AVERAGE),
435       COUNTABLE(PERF_SP_STALL_CYCLES_TP, UINT64, AVERAGE),
436       COUNTABLE(PERF_SP_STALL_CYCLES_UCHE, UINT64, AVERAGE),
437       COUNTABLE(PERF_SP_STALL_CYCLES_RB, UINT64, AVERAGE),
438       COUNTABLE(PERF_SP_NON_EXECUTION_CYCLES, UINT64, AVERAGE),
439       COUNTABLE(PERF_SP_WAVE_CONTEXTS, UINT64, AVERAGE),
440       COUNTABLE(PERF_SP_WAVE_CONTEXT_CYCLES, UINT64, AVERAGE),
441       COUNTABLE(PERF_SP_FS_STAGE_WAVE_CYCLES, UINT64, AVERAGE),
442       COUNTABLE(PERF_SP_FS_STAGE_WAVE_SAMPLES, UINT64, AVERAGE),
443       COUNTABLE(PERF_SP_VS_STAGE_WAVE_CYCLES, UINT64, AVERAGE),
444       COUNTABLE(PERF_SP_VS_STAGE_WAVE_SAMPLES, UINT64, AVERAGE),
445       COUNTABLE(PERF_SP_FS_STAGE_DURATION_CYCLES, UINT64, AVERAGE),
446       COUNTABLE(PERF_SP_VS_STAGE_DURATION_CYCLES, UINT64, AVERAGE),
447       COUNTABLE(PERF_SP_WAVE_CTRL_CYCLES, UINT64, AVERAGE),
448       COUNTABLE(PERF_SP_WAVE_LOAD_CYCLES, UINT64, AVERAGE),
449       COUNTABLE(PERF_SP_WAVE_EMIT_CYCLES, UINT64, AVERAGE),
450       COUNTABLE(PERF_SP_WAVE_NOP_CYCLES, UINT64, AVERAGE),
451       COUNTABLE(PERF_SP_WAVE_WAIT_CYCLES, UINT64, AVERAGE),
452       COUNTABLE(PERF_SP_WAVE_FETCH_CYCLES, UINT64, AVERAGE),
453       COUNTABLE(PERF_SP_WAVE_IDLE_CYCLES, UINT64, AVERAGE),
454       COUNTABLE(PERF_SP_WAVE_END_CYCLES, UINT64, AVERAGE),
455       COUNTABLE(PERF_SP_WAVE_LONG_SYNC_CYCLES, UINT64, AVERAGE),
456       COUNTABLE(PERF_SP_WAVE_SHORT_SYNC_CYCLES, UINT64, AVERAGE),
457       COUNTABLE(PERF_SP_WAVE_JOIN_CYCLES, UINT64, AVERAGE),
458       COUNTABLE(PERF_SP_LM_LOAD_INSTRUCTIONS, UINT64, AVERAGE),
459       COUNTABLE(PERF_SP_LM_STORE_INSTRUCTIONS, UINT64, AVERAGE),
460       COUNTABLE(PERF_SP_LM_ATOMICS, UINT64, AVERAGE),
461       COUNTABLE(PERF_SP_GM_LOAD_INSTRUCTIONS, UINT64, AVERAGE),
462       COUNTABLE(PERF_SP_GM_STORE_INSTRUCTIONS, UINT64, AVERAGE),
463       COUNTABLE(PERF_SP_GM_ATOMICS, UINT64, AVERAGE),
464       COUNTABLE(PERF_SP_VS_STAGE_TEX_INSTRUCTIONS, UINT64, AVERAGE),
465       COUNTABLE(PERF_SP_VS_STAGE_EFU_INSTRUCTIONS, UINT64, AVERAGE),
466       COUNTABLE(PERF_SP_VS_STAGE_FULL_ALU_INSTRUCTIONS, UINT64, AVERAGE),
467       COUNTABLE(PERF_SP_VS_STAGE_HALF_ALU_INSTRUCTIONS, UINT64, AVERAGE),
468       COUNTABLE(PERF_SP_FS_STAGE_TEX_INSTRUCTIONS, UINT64, AVERAGE),
469       COUNTABLE(PERF_SP_FS_STAGE_CFLOW_INSTRUCTIONS, UINT64, AVERAGE),
470       COUNTABLE(PERF_SP_FS_STAGE_EFU_INSTRUCTIONS, UINT64, AVERAGE),
471       COUNTABLE(PERF_SP_FS_STAGE_FULL_ALU_INSTRUCTIONS, UINT64, AVERAGE),
472       COUNTABLE(PERF_SP_FS_STAGE_HALF_ALU_INSTRUCTIONS, UINT64, AVERAGE),
473       COUNTABLE(PERF_SP_FS_STAGE_BARY_INSTRUCTIONS, UINT64, AVERAGE),
474       COUNTABLE(PERF_SP_VS_INSTRUCTIONS, UINT64, AVERAGE),
475       COUNTABLE(PERF_SP_FS_INSTRUCTIONS, UINT64, AVERAGE),
476       COUNTABLE(PERF_SP_ADDR_LOCK_COUNT, UINT64, AVERAGE),
477       COUNTABLE(PERF_SP_UCHE_READ_TRANS, UINT64, AVERAGE),
478       COUNTABLE(PERF_SP_UCHE_WRITE_TRANS, UINT64, AVERAGE),
479       COUNTABLE(PERF_SP_EXPORT_VPC_TRANS, UINT64, AVERAGE),
480       COUNTABLE(PERF_SP_EXPORT_RB_TRANS, UINT64, AVERAGE),
481       COUNTABLE(PERF_SP_PIXELS_KILLED, UINT64, AVERAGE),
482       COUNTABLE(PERF_SP_ICL1_REQUESTS, UINT64, AVERAGE),
483       COUNTABLE(PERF_SP_ICL1_MISSES, UINT64, AVERAGE),
484       COUNTABLE(PERF_SP_HS_INSTRUCTIONS, UINT64, AVERAGE),
485       COUNTABLE(PERF_SP_DS_INSTRUCTIONS, UINT64, AVERAGE),
486       COUNTABLE(PERF_SP_GS_INSTRUCTIONS, UINT64, AVERAGE),
487       COUNTABLE(PERF_SP_CS_INSTRUCTIONS, UINT64, AVERAGE),
488       COUNTABLE(PERF_SP_GPR_READ, UINT64, AVERAGE),
489       COUNTABLE(PERF_SP_GPR_WRITE, UINT64, AVERAGE),
490       COUNTABLE(PERF_SP_FS_STAGE_HALF_EFU_INSTRUCTIONS, UINT64, AVERAGE),
491       COUNTABLE(PERF_SP_VS_STAGE_HALF_EFU_INSTRUCTIONS, UINT64, AVERAGE),
492       COUNTABLE(PERF_SP_LM_BANK_CONFLICTS, UINT64, AVERAGE),
493       COUNTABLE(PERF_SP_TEX_CONTROL_WORKING_CYCLES, UINT64, AVERAGE),
494       COUNTABLE(PERF_SP_LOAD_CONTROL_WORKING_CYCLES, UINT64, AVERAGE),
495       COUNTABLE(PERF_SP_FLOW_CONTROL_WORKING_CYCLES, UINT64, AVERAGE),
496       COUNTABLE(PERF_SP_LM_WORKING_CYCLES, UINT64, AVERAGE),
497       COUNTABLE(PERF_SP_DISPATCHER_WORKING_CYCLES, UINT64, AVERAGE),
498       COUNTABLE(PERF_SP_SEQUENCER_WORKING_CYCLES, UINT64, AVERAGE),
499       COUNTABLE(PERF_SP_LOW_EFFICIENCY_STARVED_BY_TP, UINT64, AVERAGE),
500       COUNTABLE(PERF_SP_STARVE_CYCLES_HLSQ, UINT64, AVERAGE),
501       COUNTABLE(PERF_SP_NON_EXECUTION_LS_CYCLES, UINT64, AVERAGE),
502       COUNTABLE(PERF_SP_WORKING_EU, UINT64, AVERAGE),
503       COUNTABLE(PERF_SP_ANY_EU_WORKING, UINT64, AVERAGE),
504       COUNTABLE(PERF_SP_WORKING_EU_FS_STAGE, UINT64, AVERAGE),
505       COUNTABLE(PERF_SP_ANY_EU_WORKING_FS_STAGE, UINT64, AVERAGE),
506       COUNTABLE(PERF_SP_WORKING_EU_VS_STAGE, UINT64, AVERAGE),
507       COUNTABLE(PERF_SP_ANY_EU_WORKING_VS_STAGE, UINT64, AVERAGE),
508       COUNTABLE(PERF_SP_WORKING_EU_CS_STAGE, UINT64, AVERAGE),
509       COUNTABLE(PERF_SP_ANY_EU_WORKING_CS_STAGE, UINT64, AVERAGE),
510       COUNTABLE(PERF_SP_GPR_READ_PREFETCH, UINT64, AVERAGE),
511       COUNTABLE(PERF_SP_GPR_READ_CONFLICT, UINT64, AVERAGE),
512       COUNTABLE(PERF_SP_GPR_WRITE_CONFLICT, UINT64, AVERAGE),
513       COUNTABLE(PERF_SP_GM_LOAD_LATENCY_CYCLES, UINT64, AVERAGE),
514       COUNTABLE(PERF_SP_GM_LOAD_LATENCY_SAMPLES, UINT64, AVERAGE),
515       COUNTABLE(PERF_SP_EXECUTABLE_WAVES, UINT64, AVERAGE),
516 };
517 
/*
 * Counter slots for the "TP" group: twelve entries, indices 0 through 11.
 * Each COUNTER() is given TPL1_PERFCTR_TP_SEL(n), RBBM_PERFCTR_TP(n) and
 * RBBM_PERFCTR_TP(n)+1 for the same index n.
 * NOTE(review): presumably the select register followed by the low and high
 * words of the counter value -- confirm against the COUNTER definition in
 * freedreno_perfcntr.h.
 */
518 static const struct fd_perfcntr_counter tp_counters[] = {
519       COUNTER(TPL1_PERFCTR_TP_SEL(0),  RBBM_PERFCTR_TP(0),  RBBM_PERFCTR_TP(0)+1),
520       COUNTER(TPL1_PERFCTR_TP_SEL(1),  RBBM_PERFCTR_TP(1),  RBBM_PERFCTR_TP(1)+1),
521       COUNTER(TPL1_PERFCTR_TP_SEL(2),  RBBM_PERFCTR_TP(2),  RBBM_PERFCTR_TP(2)+1),
522       COUNTER(TPL1_PERFCTR_TP_SEL(3),  RBBM_PERFCTR_TP(3),  RBBM_PERFCTR_TP(3)+1),
523       COUNTER(TPL1_PERFCTR_TP_SEL(4),  RBBM_PERFCTR_TP(4),  RBBM_PERFCTR_TP(4)+1),
524       COUNTER(TPL1_PERFCTR_TP_SEL(5),  RBBM_PERFCTR_TP(5),  RBBM_PERFCTR_TP(5)+1),
525       COUNTER(TPL1_PERFCTR_TP_SEL(6),  RBBM_PERFCTR_TP(6),  RBBM_PERFCTR_TP(6)+1),
526       COUNTER(TPL1_PERFCTR_TP_SEL(7),  RBBM_PERFCTR_TP(7),  RBBM_PERFCTR_TP(7)+1),
527       COUNTER(TPL1_PERFCTR_TP_SEL(8),  RBBM_PERFCTR_TP(8),  RBBM_PERFCTR_TP(8)+1),
528       COUNTER(TPL1_PERFCTR_TP_SEL(9),  RBBM_PERFCTR_TP(9),  RBBM_PERFCTR_TP(9)+1),
529       COUNTER(TPL1_PERFCTR_TP_SEL(10), RBBM_PERFCTR_TP(10), RBBM_PERFCTR_TP(10)+1),
530       COUNTER(TPL1_PERFCTR_TP_SEL(11), RBBM_PERFCTR_TP(11), RBBM_PERFCTR_TP(11)+1),
531 };
532 
/*
 * Countables for the "TP" group, one COUNTABLE() per PERF_TP_* name.
 * Every entry passes the same UINT64 / AVERAGE arguments; their meaning is
 * defined by the COUNTABLE macro, which is not part of this table.
 * This table is paired with tp_counters in a6xx_perfcntr_groups.
 * NOTE(review): check how entries are looked up before reordering them.
 */
533 static const struct fd_perfcntr_countable tp_countables[] = {
534       COUNTABLE(PERF_TP_BUSY_CYCLES, UINT64, AVERAGE),
535       COUNTABLE(PERF_TP_STALL_CYCLES_UCHE, UINT64, AVERAGE),
536       COUNTABLE(PERF_TP_LATENCY_CYCLES, UINT64, AVERAGE),
537       COUNTABLE(PERF_TP_LATENCY_TRANS, UINT64, AVERAGE),
538       COUNTABLE(PERF_TP_FLAG_CACHE_REQUEST_SAMPLES, UINT64, AVERAGE),
539       COUNTABLE(PERF_TP_FLAG_CACHE_REQUEST_LATENCY, UINT64, AVERAGE),
540       COUNTABLE(PERF_TP_L1_CACHELINE_REQUESTS, UINT64, AVERAGE),
541       COUNTABLE(PERF_TP_L1_CACHELINE_MISSES, UINT64, AVERAGE),
542       COUNTABLE(PERF_TP_SP_TP_TRANS, UINT64, AVERAGE),
543       COUNTABLE(PERF_TP_TP_SP_TRANS, UINT64, AVERAGE),
544       COUNTABLE(PERF_TP_OUTPUT_PIXELS, UINT64, AVERAGE),
545       COUNTABLE(PERF_TP_FILTER_WORKLOAD_16BIT, UINT64, AVERAGE),
546       COUNTABLE(PERF_TP_FILTER_WORKLOAD_32BIT, UINT64, AVERAGE),
547       COUNTABLE(PERF_TP_QUADS_RECEIVED, UINT64, AVERAGE),
548       COUNTABLE(PERF_TP_QUADS_OFFSET, UINT64, AVERAGE),
549       COUNTABLE(PERF_TP_QUADS_SHADOW, UINT64, AVERAGE),
550       COUNTABLE(PERF_TP_QUADS_ARRAY, UINT64, AVERAGE),
551       COUNTABLE(PERF_TP_QUADS_GRADIENT, UINT64, AVERAGE),
552       COUNTABLE(PERF_TP_QUADS_1D, UINT64, AVERAGE),
553       COUNTABLE(PERF_TP_QUADS_2D, UINT64, AVERAGE),
554       COUNTABLE(PERF_TP_QUADS_BUFFER, UINT64, AVERAGE),
555       COUNTABLE(PERF_TP_QUADS_3D, UINT64, AVERAGE),
556       COUNTABLE(PERF_TP_QUADS_CUBE, UINT64, AVERAGE),
557       COUNTABLE(PERF_TP_DIVERGENT_QUADS_RECEIVED, UINT64, AVERAGE),
558       COUNTABLE(PERF_TP_PRT_NON_RESIDENT_EVENTS, UINT64, AVERAGE),
559       COUNTABLE(PERF_TP_OUTPUT_PIXELS_POINT, UINT64, AVERAGE),
560       COUNTABLE(PERF_TP_OUTPUT_PIXELS_BILINEAR, UINT64, AVERAGE),
561       COUNTABLE(PERF_TP_OUTPUT_PIXELS_MIP, UINT64, AVERAGE),
562       COUNTABLE(PERF_TP_OUTPUT_PIXELS_ANISO, UINT64, AVERAGE),
563       COUNTABLE(PERF_TP_OUTPUT_PIXELS_ZERO_LOD, UINT64, AVERAGE),
564       COUNTABLE(PERF_TP_FLAG_CACHE_REQUESTS, UINT64, AVERAGE),
565       COUNTABLE(PERF_TP_FLAG_CACHE_MISSES, UINT64, AVERAGE),
566       COUNTABLE(PERF_TP_L1_5_L2_REQUESTS, UINT64, AVERAGE),
567       COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS, UINT64, AVERAGE),
568       COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS_POINT, UINT64, AVERAGE),
569       COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS_BILINEAR, UINT64, AVERAGE),
570       COUNTABLE(PERF_TP_2D_FILTER_WORKLOAD_16BIT, UINT64, AVERAGE),
571       COUNTABLE(PERF_TP_2D_FILTER_WORKLOAD_32BIT, UINT64, AVERAGE),
572       COUNTABLE(PERF_TP_TPA2TPC_TRANS, UINT64, AVERAGE),
573       COUNTABLE(PERF_TP_L1_MISSES_ASTC_1TILE, UINT64, AVERAGE),
574       COUNTABLE(PERF_TP_L1_MISSES_ASTC_2TILE, UINT64, AVERAGE),
575       COUNTABLE(PERF_TP_L1_MISSES_ASTC_4TILE, UINT64, AVERAGE),
576       COUNTABLE(PERF_TP_L1_5_L2_COMPRESS_REQS, UINT64, AVERAGE),
577       COUNTABLE(PERF_TP_L1_5_L2_COMPRESS_MISS, UINT64, AVERAGE),
578       COUNTABLE(PERF_TP_L1_BANK_CONFLICT, UINT64, AVERAGE),
579       COUNTABLE(PERF_TP_L1_5_MISS_LATENCY_CYCLES, UINT64, AVERAGE),
580       COUNTABLE(PERF_TP_L1_5_MISS_LATENCY_TRANS, UINT64, AVERAGE),
581       COUNTABLE(PERF_TP_QUADS_CONSTANT_MULTIPLIED, UINT64, AVERAGE),
582       COUNTABLE(PERF_TP_FRONTEND_WORKING_CYCLES, UINT64, AVERAGE),
583       COUNTABLE(PERF_TP_L1_TAG_WORKING_CYCLES, UINT64, AVERAGE),
584       COUNTABLE(PERF_TP_L1_DATA_WRITE_WORKING_CYCLES, UINT64, AVERAGE),
585       COUNTABLE(PERF_TP_PRE_L1_DECOM_WORKING_CYCLES, UINT64, AVERAGE),
586       COUNTABLE(PERF_TP_BACKEND_WORKING_CYCLES, UINT64, AVERAGE),
587       COUNTABLE(PERF_TP_FLAG_CACHE_WORKING_CYCLES, UINT64, AVERAGE),
588       COUNTABLE(PERF_TP_L1_5_CACHE_WORKING_CYCLES, UINT64, AVERAGE),
589       COUNTABLE(PERF_TP_STARVE_CYCLES_SP, UINT64, AVERAGE),
590       COUNTABLE(PERF_TP_STARVE_CYCLES_UCHE, UINT64, AVERAGE),
591 };
592 
/*
 * Counter slots for the "UCHE" group: twelve entries, indices 0 through 11.
 * Each COUNTER() is given UCHE_PERFCTR_UCHE_SEL(n), RBBM_PERFCTR_UCHE(n) and
 * RBBM_PERFCTR_UCHE(n)+1 for the same index n.
 * NOTE(review): presumably select register, then low/high words of the
 * counter value -- confirm against COUNTER in freedreno_perfcntr.h.
 */
593 static const struct fd_perfcntr_counter uche_counters[] = {
594       COUNTER(UCHE_PERFCTR_UCHE_SEL(0),  RBBM_PERFCTR_UCHE(0),  RBBM_PERFCTR_UCHE(0)+1),
595       COUNTER(UCHE_PERFCTR_UCHE_SEL(1),  RBBM_PERFCTR_UCHE(1),  RBBM_PERFCTR_UCHE(1)+1),
596       COUNTER(UCHE_PERFCTR_UCHE_SEL(2),  RBBM_PERFCTR_UCHE(2),  RBBM_PERFCTR_UCHE(2)+1),
597       COUNTER(UCHE_PERFCTR_UCHE_SEL(3),  RBBM_PERFCTR_UCHE(3),  RBBM_PERFCTR_UCHE(3)+1),
598       COUNTER(UCHE_PERFCTR_UCHE_SEL(4),  RBBM_PERFCTR_UCHE(4),  RBBM_PERFCTR_UCHE(4)+1),
599       COUNTER(UCHE_PERFCTR_UCHE_SEL(5),  RBBM_PERFCTR_UCHE(5),  RBBM_PERFCTR_UCHE(5)+1),
600       COUNTER(UCHE_PERFCTR_UCHE_SEL(6),  RBBM_PERFCTR_UCHE(6),  RBBM_PERFCTR_UCHE(6)+1),
601       COUNTER(UCHE_PERFCTR_UCHE_SEL(7),  RBBM_PERFCTR_UCHE(7),  RBBM_PERFCTR_UCHE(7)+1),
602       COUNTER(UCHE_PERFCTR_UCHE_SEL(8),  RBBM_PERFCTR_UCHE(8),  RBBM_PERFCTR_UCHE(8)+1),
603       COUNTER(UCHE_PERFCTR_UCHE_SEL(9),  RBBM_PERFCTR_UCHE(9),  RBBM_PERFCTR_UCHE(9)+1),
604       COUNTER(UCHE_PERFCTR_UCHE_SEL(10), RBBM_PERFCTR_UCHE(10), RBBM_PERFCTR_UCHE(10)+1),
605       COUNTER(UCHE_PERFCTR_UCHE_SEL(11), RBBM_PERFCTR_UCHE(11), RBBM_PERFCTR_UCHE(11)+1),
606 };
607 
/*
 * Countables for the "UCHE" group, one COUNTABLE() per PERF_UCHE_* name.
 * Every entry passes the same UINT64 / AVERAGE arguments; their meaning is
 * defined by the COUNTABLE macro, which is not part of this table.
 * This table is paired with uche_counters in a6xx_perfcntr_groups.
 * NOTE(review): check how entries are looked up before reordering them.
 */
608 static const struct fd_perfcntr_countable uche_countables[] = {
609       COUNTABLE(PERF_UCHE_BUSY_CYCLES, UINT64, AVERAGE),
610       COUNTABLE(PERF_UCHE_STALL_CYCLES_ARBITER, UINT64, AVERAGE),
611       COUNTABLE(PERF_UCHE_VBIF_LATENCY_CYCLES, UINT64, AVERAGE),
612       COUNTABLE(PERF_UCHE_VBIF_LATENCY_SAMPLES, UINT64, AVERAGE),
613       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_TP, UINT64, AVERAGE),
614       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_VFD, UINT64, AVERAGE),
615       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_HLSQ, UINT64, AVERAGE),
616       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_LRZ, UINT64, AVERAGE),
617       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_SP, UINT64, AVERAGE),
618       COUNTABLE(PERF_UCHE_READ_REQUESTS_TP, UINT64, AVERAGE),
619       COUNTABLE(PERF_UCHE_READ_REQUESTS_VFD, UINT64, AVERAGE),
620       COUNTABLE(PERF_UCHE_READ_REQUESTS_HLSQ, UINT64, AVERAGE),
621       COUNTABLE(PERF_UCHE_READ_REQUESTS_LRZ, UINT64, AVERAGE),
622       COUNTABLE(PERF_UCHE_READ_REQUESTS_SP, UINT64, AVERAGE),
623       COUNTABLE(PERF_UCHE_WRITE_REQUESTS_LRZ, UINT64, AVERAGE),
624       COUNTABLE(PERF_UCHE_WRITE_REQUESTS_SP, UINT64, AVERAGE),
625       COUNTABLE(PERF_UCHE_WRITE_REQUESTS_VPC, UINT64, AVERAGE),
626       COUNTABLE(PERF_UCHE_WRITE_REQUESTS_VSC, UINT64, AVERAGE),
627       COUNTABLE(PERF_UCHE_EVICTS, UINT64, AVERAGE),
628       COUNTABLE(PERF_UCHE_BANK_REQ0, UINT64, AVERAGE),
629       COUNTABLE(PERF_UCHE_BANK_REQ1, UINT64, AVERAGE),
630       COUNTABLE(PERF_UCHE_BANK_REQ2, UINT64, AVERAGE),
631       COUNTABLE(PERF_UCHE_BANK_REQ3, UINT64, AVERAGE),
632       COUNTABLE(PERF_UCHE_BANK_REQ4, UINT64, AVERAGE),
633       COUNTABLE(PERF_UCHE_BANK_REQ5, UINT64, AVERAGE),
634       COUNTABLE(PERF_UCHE_BANK_REQ6, UINT64, AVERAGE),
635       COUNTABLE(PERF_UCHE_BANK_REQ7, UINT64, AVERAGE),
636       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_CH0, UINT64, AVERAGE),
637       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_CH1, UINT64, AVERAGE),
638       COUNTABLE(PERF_UCHE_GMEM_READ_BEATS, UINT64, AVERAGE),
639       COUNTABLE(PERF_UCHE_TPH_REF_FULL, UINT64, AVERAGE),
640       COUNTABLE(PERF_UCHE_TPH_VICTIM_FULL, UINT64, AVERAGE),
641       COUNTABLE(PERF_UCHE_TPH_EXT_FULL, UINT64, AVERAGE),
642       COUNTABLE(PERF_UCHE_VBIF_STALL_WRITE_DATA, UINT64, AVERAGE),
643       COUNTABLE(PERF_UCHE_DCMP_LATENCY_SAMPLES, UINT64, AVERAGE),
644       COUNTABLE(PERF_UCHE_DCMP_LATENCY_CYCLES, UINT64, AVERAGE),
645       COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_PC, UINT64, AVERAGE),
646       COUNTABLE(PERF_UCHE_READ_REQUESTS_PC, UINT64, AVERAGE),
647       COUNTABLE(PERF_UCHE_RAM_READ_REQ, UINT64, AVERAGE),
648       COUNTABLE(PERF_UCHE_RAM_WRITE_REQ, UINT64, AVERAGE),
649 };
650 
/*
 * Counter slots for the "VFD" group: eight entries, indices 0 through 7.
 * Each COUNTER() is given VFD_PERFCTR_VFD_SEL(n), RBBM_PERFCTR_VFD(n) and
 * RBBM_PERFCTR_VFD(n)+1 for the same index n.
 * NOTE(review): presumably select register, then low/high words of the
 * counter value -- confirm against COUNTER in freedreno_perfcntr.h.
 */
651 static const struct fd_perfcntr_counter vfd_counters[] = {
652       COUNTER(VFD_PERFCTR_VFD_SEL(0), RBBM_PERFCTR_VFD(0), RBBM_PERFCTR_VFD(0)+1),
653       COUNTER(VFD_PERFCTR_VFD_SEL(1), RBBM_PERFCTR_VFD(1), RBBM_PERFCTR_VFD(1)+1),
654       COUNTER(VFD_PERFCTR_VFD_SEL(2), RBBM_PERFCTR_VFD(2), RBBM_PERFCTR_VFD(2)+1),
655       COUNTER(VFD_PERFCTR_VFD_SEL(3), RBBM_PERFCTR_VFD(3), RBBM_PERFCTR_VFD(3)+1),
656       COUNTER(VFD_PERFCTR_VFD_SEL(4), RBBM_PERFCTR_VFD(4), RBBM_PERFCTR_VFD(4)+1),
657       COUNTER(VFD_PERFCTR_VFD_SEL(5), RBBM_PERFCTR_VFD(5), RBBM_PERFCTR_VFD(5)+1),
658       COUNTER(VFD_PERFCTR_VFD_SEL(6), RBBM_PERFCTR_VFD(6), RBBM_PERFCTR_VFD(6)+1),
659       COUNTER(VFD_PERFCTR_VFD_SEL(7), RBBM_PERFCTR_VFD(7), RBBM_PERFCTR_VFD(7)+1),
660 };
661 
/*
 * Countables for the "VFD" group. Most names use the PERF_VFD_ prefix; the
 * last five use PERF_VFDP_.
 * Every entry passes the same UINT64 / AVERAGE arguments; their meaning is
 * defined by the COUNTABLE macro, which is not part of this table.
 * This table is paired with vfd_counters in a6xx_perfcntr_groups.
 * NOTE(review): check how entries are looked up before reordering them.
 */
662 static const struct fd_perfcntr_countable vfd_countables[] = {
663       COUNTABLE(PERF_VFD_BUSY_CYCLES, UINT64, AVERAGE),
664       COUNTABLE(PERF_VFD_STALL_CYCLES_UCHE, UINT64, AVERAGE),
665       COUNTABLE(PERF_VFD_STALL_CYCLES_VPC_ALLOC, UINT64, AVERAGE),
666       COUNTABLE(PERF_VFD_STALL_CYCLES_SP_INFO, UINT64, AVERAGE),
667       COUNTABLE(PERF_VFD_STALL_CYCLES_SP_ATTR, UINT64, AVERAGE),
668       COUNTABLE(PERF_VFD_STARVE_CYCLES_UCHE, UINT64, AVERAGE),
669       COUNTABLE(PERF_VFD_RBUFFER_FULL, UINT64, AVERAGE),
670       COUNTABLE(PERF_VFD_ATTR_INFO_FIFO_FULL, UINT64, AVERAGE),
671       COUNTABLE(PERF_VFD_DECODED_ATTRIBUTE_BYTES, UINT64, AVERAGE),
672       COUNTABLE(PERF_VFD_NUM_ATTRIBUTES, UINT64, AVERAGE),
673       COUNTABLE(PERF_VFD_UPPER_SHADER_FIBERS, UINT64, AVERAGE),
674       COUNTABLE(PERF_VFD_LOWER_SHADER_FIBERS, UINT64, AVERAGE),
675       COUNTABLE(PERF_VFD_MODE_0_FIBERS, UINT64, AVERAGE),
676       COUNTABLE(PERF_VFD_MODE_1_FIBERS, UINT64, AVERAGE),
677       COUNTABLE(PERF_VFD_MODE_2_FIBERS, UINT64, AVERAGE),
678       COUNTABLE(PERF_VFD_MODE_3_FIBERS, UINT64, AVERAGE),
679       COUNTABLE(PERF_VFD_MODE_4_FIBERS, UINT64, AVERAGE),
680       COUNTABLE(PERF_VFD_TOTAL_VERTICES, UINT64, AVERAGE),
681       COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD, UINT64, AVERAGE),
682       COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD_INDEX, UINT64, AVERAGE),
683       COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD_PROG, UINT64, AVERAGE),
684       COUNTABLE(PERF_VFDP_STARVE_CYCLES_PC, UINT64, AVERAGE),
685       COUNTABLE(PERF_VFDP_VS_STAGE_WAVES, UINT64, AVERAGE),
686 };
687 
/*
 * Counter slots for the "VPC" group: six entries, indices 0 through 5.
 * Each COUNTER() is given VPC_PERFCTR_VPC_SEL(n), RBBM_PERFCTR_VPC(n) and
 * RBBM_PERFCTR_VPC(n)+1 for the same index n.
 * NOTE(review): presumably select register, then low/high words of the
 * counter value -- confirm against COUNTER in freedreno_perfcntr.h.
 */
688 static const struct fd_perfcntr_counter vpc_counters[] = {
689       COUNTER(VPC_PERFCTR_VPC_SEL(0), RBBM_PERFCTR_VPC(0), RBBM_PERFCTR_VPC(0)+1),
690       COUNTER(VPC_PERFCTR_VPC_SEL(1), RBBM_PERFCTR_VPC(1), RBBM_PERFCTR_VPC(1)+1),
691       COUNTER(VPC_PERFCTR_VPC_SEL(2), RBBM_PERFCTR_VPC(2), RBBM_PERFCTR_VPC(2)+1),
692       COUNTER(VPC_PERFCTR_VPC_SEL(3), RBBM_PERFCTR_VPC(3), RBBM_PERFCTR_VPC(3)+1),
693       COUNTER(VPC_PERFCTR_VPC_SEL(4), RBBM_PERFCTR_VPC(4), RBBM_PERFCTR_VPC(4)+1),
694       COUNTER(VPC_PERFCTR_VPC_SEL(5), RBBM_PERFCTR_VPC(5), RBBM_PERFCTR_VPC(5)+1),
695 };
696 
/*
 * Countables for the "VPC" group, one COUNTABLE() per PERF_VPC_* name.
 * Every entry passes the same UINT64 / AVERAGE arguments; their meaning is
 * defined by the COUNTABLE macro, which is not part of this table.
 * This table is paired with vpc_counters in a6xx_perfcntr_groups.
 * NOTE(review): check how entries are looked up before reordering them.
 */
697 static const struct fd_perfcntr_countable vpc_countables[] = {
698       COUNTABLE(PERF_VPC_BUSY_CYCLES, UINT64, AVERAGE),
699       COUNTABLE(PERF_VPC_WORKING_CYCLES, UINT64, AVERAGE),
700       COUNTABLE(PERF_VPC_STALL_CYCLES_UCHE, UINT64, AVERAGE),
701       COUNTABLE(PERF_VPC_STALL_CYCLES_VFD_WACK, UINT64, AVERAGE),
702       COUNTABLE(PERF_VPC_STALL_CYCLES_HLSQ_PRIM_ALLOC, UINT64, AVERAGE),
703       COUNTABLE(PERF_VPC_STALL_CYCLES_PC, UINT64, AVERAGE),
704       COUNTABLE(PERF_VPC_STALL_CYCLES_SP_LM, UINT64, AVERAGE),
705       COUNTABLE(PERF_VPC_STARVE_CYCLES_SP, UINT64, AVERAGE),
706       COUNTABLE(PERF_VPC_STARVE_CYCLES_LRZ, UINT64, AVERAGE),
707       COUNTABLE(PERF_VPC_PC_PRIMITIVES, UINT64, AVERAGE),
708       COUNTABLE(PERF_VPC_SP_COMPONENTS, UINT64, AVERAGE),
709       COUNTABLE(PERF_VPC_STALL_CYCLES_VPCRAM_POS, UINT64, AVERAGE),
710       COUNTABLE(PERF_VPC_LRZ_ASSIGN_PRIMITIVES, UINT64, AVERAGE),
711       COUNTABLE(PERF_VPC_RB_VISIBLE_PRIMITIVES, UINT64, AVERAGE),
712       COUNTABLE(PERF_VPC_LM_TRANSACTION, UINT64, AVERAGE),
713       COUNTABLE(PERF_VPC_STREAMOUT_TRANSACTION, UINT64, AVERAGE),
714       COUNTABLE(PERF_VPC_VS_BUSY_CYCLES, UINT64, AVERAGE),
715       COUNTABLE(PERF_VPC_PS_BUSY_CYCLES, UINT64, AVERAGE),
716       COUNTABLE(PERF_VPC_VS_WORKING_CYCLES, UINT64, AVERAGE),
717       COUNTABLE(PERF_VPC_PS_WORKING_CYCLES, UINT64, AVERAGE),
718       COUNTABLE(PERF_VPC_STARVE_CYCLES_RB, UINT64, AVERAGE),
719       COUNTABLE(PERF_VPC_NUM_VPCRAM_READ_POS, UINT64, AVERAGE),
720       COUNTABLE(PERF_VPC_WIT_FULL_CYCLES, UINT64, AVERAGE),
721       COUNTABLE(PERF_VPC_VPCRAM_FULL_CYCLES, UINT64, AVERAGE),
722       COUNTABLE(PERF_VPC_LM_FULL_WAIT_FOR_INTP_END, UINT64, AVERAGE),
723       COUNTABLE(PERF_VPC_NUM_VPCRAM_WRITE, UINT64, AVERAGE),
724       COUNTABLE(PERF_VPC_NUM_VPCRAM_READ_SO, UINT64, AVERAGE),
725       COUNTABLE(PERF_VPC_NUM_ATTR_REQ_LM, UINT64, AVERAGE),
726 };
727 
/*
 * Counter slots for the "VSC" group: two entries, indices 0 and 1.
 * Each COUNTER() is given VSC_PERFCTR_VSC_SEL(n), RBBM_PERFCTR_VSC(n) and
 * RBBM_PERFCTR_VSC(n)+1 for the same index n.
 * NOTE(review): presumably select register, then low/high words of the
 * counter value -- confirm against COUNTER in freedreno_perfcntr.h.
 */
728 static const struct fd_perfcntr_counter vsc_counters[] = {
729       COUNTER(VSC_PERFCTR_VSC_SEL(0), RBBM_PERFCTR_VSC(0), RBBM_PERFCTR_VSC(0)+1),
730       COUNTER(VSC_PERFCTR_VSC_SEL(1), RBBM_PERFCTR_VSC(1), RBBM_PERFCTR_VSC(1)+1),
731 };
732 
/*
 * Countables for the "VSC" group, one COUNTABLE() per PERF_VSC_* name.
 * Every entry passes the same UINT64 / AVERAGE arguments; their meaning is
 * defined by the COUNTABLE macro, which is not part of this table.
 * This table is paired with vsc_counters in a6xx_perfcntr_groups.
 * NOTE(review): check how entries are looked up before reordering them.
 */
733 static const struct fd_perfcntr_countable vsc_countables[] = {
734       COUNTABLE(PERF_VSC_BUSY_CYCLES, UINT64, AVERAGE),
735       COUNTABLE(PERF_VSC_WORKING_CYCLES, UINT64, AVERAGE),
736       COUNTABLE(PERF_VSC_STALL_CYCLES_UCHE, UINT64, AVERAGE),
737       COUNTABLE(PERF_VSC_EOT_NUM, UINT64, AVERAGE),
738       COUNTABLE(PERF_VSC_INPUT_TILES, UINT64, AVERAGE),
739 };
740 
/*
 * Top-level table of a6xx performance counter groups. Unlike the per-block
 * tables it references, this array is not static, so it has external linkage.
 * Each GROUP() is given a name string plus that block's counter table and
 * countable table.
 * The "RBBM" and "VBIF" entries are commented out and therefore are not part
 * of the array.
 * NOTE(review): entry order fixes each group's array index; check users of
 * the table before reordering or re-enabling entries.
 */
741 const struct fd_perfcntr_group a6xx_perfcntr_groups[] = {
742       GROUP("CP", cp_counters, cp_countables),
743       GROUP("CCU", ccu_counters, ccu_countables),
744       GROUP("TSE", tse_counters, tse_countables),
745       GROUP("RAS", ras_counters, ras_countables),
746       GROUP("LRZ", lrz_counters, lrz_countables),
747       GROUP("HLSQ", hlsq_counters, hlsq_countables),
748       GROUP("PC", pc_counters, pc_countables),
749       GROUP("RB", rb_counters, rb_countables),
750       // disabled: GROUP("RBBM", rbbm_counters, rbbm_countables),
751       GROUP("SP", sp_counters, sp_countables),
752       GROUP("TP", tp_counters, tp_countables),
753       GROUP("UCHE", uche_counters, uche_countables),
754       GROUP("VFD", vfd_counters, vfd_countables),
755       GROUP("VPC", vpc_counters, vpc_countables),
756       GROUP("VSC", vsc_counters, vsc_countables),
757       // disabled: GROUP("VBIF", vbif_counters, vbif_countables),
758 };
759 
/*
 * Number of entries in a6xx_perfcntr_groups. Derived with ARRAY_SIZE so the
 * count follows the table when groups are added or removed.
 */
760 const unsigned a6xx_num_perfcntr_groups = ARRAY_SIZE(a6xx_perfcntr_groups);
761 
762 #endif /* FD6_PERFCNTR_H_ */
763 
764