Path: blob/21.2-virgl/src/freedreno/perfcntrs/fd5_perfcntr.c
4565 views
/*1* Copyright (C) 2018 Rob Clark <[email protected]>2*3* Permission is hereby granted, free of charge, to any person obtaining a4* copy of this software and associated documentation files (the "Software"),5* to deal in the Software without restriction, including without limitation6* the rights to use, copy, modify, merge, publish, distribute, sublicense,7* and/or sell copies of the Software, and to permit persons to whom the8* Software is furnished to do so, subject to the following conditions:9*10* The above copyright notice and this permission notice (including the next11* paragraph) shall be included in all copies or substantial portions of the12* Software.13*14* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR15* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,16* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL17* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER18* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,19* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE20* SOFTWARE.21*22* Authors:23* Rob Clark <[email protected]>24*/2526#ifndef FD5_PERFCNTR_H_27#define FD5_PERFCNTR_H_2829#include "util/half_float.h"30#include "util/u_math.h"31#include "adreno_common.xml.h"32#include "a5xx.xml.h"3334#define REG(_x) REG_A5XX_ ## _x35#include "freedreno_perfcntr.h"3637static const struct fd_perfcntr_counter cp_counters[] = {38//RESERVED: for kernel39// COUNTER(CP_PERFCTR_CP_SEL_0, RBBM_PERFCTR_CP_0_LO, RBBM_PERFCTR_CP_0_HI),40COUNTER(CP_PERFCTR_CP_SEL_1, RBBM_PERFCTR_CP_1_LO, RBBM_PERFCTR_CP_1_HI),41COUNTER(CP_PERFCTR_CP_SEL_2, RBBM_PERFCTR_CP_2_LO, RBBM_PERFCTR_CP_2_HI),42COUNTER(CP_PERFCTR_CP_SEL_3, RBBM_PERFCTR_CP_3_LO, RBBM_PERFCTR_CP_3_HI),43COUNTER(CP_PERFCTR_CP_SEL_4, RBBM_PERFCTR_CP_4_LO, RBBM_PERFCTR_CP_4_HI),44COUNTER(CP_PERFCTR_CP_SEL_5, RBBM_PERFCTR_CP_5_LO, RBBM_PERFCTR_CP_5_HI),45COUNTER(CP_PERFCTR_CP_SEL_6, RBBM_PERFCTR_CP_6_LO, RBBM_PERFCTR_CP_6_HI),46COUNTER(CP_PERFCTR_CP_SEL_7, RBBM_PERFCTR_CP_7_LO, RBBM_PERFCTR_CP_7_HI),47};4849static const struct fd_perfcntr_countable cp_countables[] = {50COUNTABLE(PERF_CP_ALWAYS_COUNT, UINT64, AVERAGE),51COUNTABLE(PERF_CP_BUSY_GFX_CORE_IDLE, UINT64, AVERAGE),52COUNTABLE(PERF_CP_BUSY_CYCLES, UINT64, AVERAGE),53COUNTABLE(PERF_CP_PFP_IDLE, UINT64, AVERAGE),54COUNTABLE(PERF_CP_PFP_BUSY_WORKING, UINT64, AVERAGE),55COUNTABLE(PERF_CP_PFP_STALL_CYCLES_ANY, UINT64, AVERAGE),56COUNTABLE(PERF_CP_PFP_STARVE_CYCLES_ANY, UINT64, AVERAGE),57COUNTABLE(PERF_CP_PFP_ICACHE_MISS, UINT64, AVERAGE),58COUNTABLE(PERF_CP_PFP_ICACHE_HIT, UINT64, AVERAGE),59COUNTABLE(PERF_CP_PFP_MATCH_PM4_PKT_PROFILE, UINT64, AVERAGE),60COUNTABLE(PERF_CP_ME_BUSY_WORKING, UINT64, AVERAGE),61COUNTABLE(PERF_CP_ME_IDLE, UINT64, AVERAGE),62COUNTABLE(PERF_CP_ME_STARVE_CYCLES_ANY, UINT64, AVERAGE),63COUNTABLE(PERF_CP_ME_FIFO_EMPTY_PFP_IDLE, UINT64, AVERAGE),64COUNTABLE(PERF_CP_ME_FIFO_EMPTY_PFP_BUSY, UINT64, AVERAGE),65COUNTABLE(PERF_CP_ME_FIFO_FULL_ME_BUSY, UINT64, AVERAGE),66COUNTABLE(PERF_CP_ME_FIFO_FULL_ME_NON_WORKING, UINT64, AVERAGE),67COUNTABLE(PERF_CP_ME_STALL_CYCLES_ANY, UINT64, AVERAGE),68COUNTABLE(PERF_CP_ME_ICACHE_MISS, UINT64, AVERAGE),69COUNTABLE(PERF_CP_ME_ICACHE_HIT, UINT64, AVERAGE),70COUNTABLE(PERF_CP_NUM_PREEMPTIONS, UINT64, AVERAGE),71COUNTABLE(PERF_CP_PREEMPTION_REACTION_DELAY, UINT64, AVERAGE),72COUNTABLE(PERF_CP_PREEMPTION_SWITCH_OUT_TIME, UINT64, AVERAGE),73COUNTABLE(PERF_CP_PREEMPTION_SWITCH_IN_TIME, UINT64, AVERAGE),74COUNTABLE(PERF_CP_DEAD_DRAWS_IN_BIN_RENDER, UINT64, AVERAGE),75COUNTABLE(PERF_CP_PREDICATED_DRAWS_KILLED, UINT64, AVERAGE),76COUNTABLE(PERF_CP_MODE_SWITCH, UINT64, AVERAGE),77COUNTABLE(PERF_CP_ZPASS_DONE, UINT64, AVERAGE),78COUNTABLE(PERF_CP_CONTEXT_DONE, UINT64, AVERAGE),79COUNTABLE(PERF_CP_CACHE_FLUSH, UINT64, AVERAGE),80COUNTABLE(PERF_CP_LONG_PREEMPTIONS, UINT64, AVERAGE),81};8283static const struct fd_perfcntr_counter ccu_counters[] = {84COUNTER(RB_PERFCTR_CCU_SEL_0, RBBM_PERFCTR_CCU_0_LO, RBBM_PERFCTR_CCU_0_HI),85COUNTER(RB_PERFCTR_CCU_SEL_1, RBBM_PERFCTR_CCU_1_LO, RBBM_PERFCTR_CCU_1_HI),86COUNTER(RB_PERFCTR_CCU_SEL_2, RBBM_PERFCTR_CCU_2_LO, RBBM_PERFCTR_CCU_2_HI),87COUNTER(RB_PERFCTR_CCU_SEL_3, RBBM_PERFCTR_CCU_3_LO, RBBM_PERFCTR_CCU_3_HI),88};8990static const struct fd_perfcntr_countable ccu_countables[] = {91COUNTABLE(PERF_CCU_BUSY_CYCLES, UINT64, AVERAGE),92COUNTABLE(PERF_CCU_STALL_CYCLES_RB_DEPTH_RETURN, UINT64, AVERAGE),93COUNTABLE(PERF_CCU_STALL_CYCLES_RB_COLOR_RETURN, UINT64, AVERAGE),94COUNTABLE(PERF_CCU_STARVE_CYCLES_FLAG_RETURN, UINT64, AVERAGE),95COUNTABLE(PERF_CCU_DEPTH_BLOCKS, UINT64, AVERAGE),96COUNTABLE(PERF_CCU_COLOR_BLOCKS, UINT64, AVERAGE),97COUNTABLE(PERF_CCU_DEPTH_BLOCK_HIT, UINT64, AVERAGE),98COUNTABLE(PERF_CCU_COLOR_BLOCK_HIT, UINT64, AVERAGE),99COUNTABLE(PERF_CCU_PARTIAL_BLOCK_READ, UINT64, AVERAGE),100COUNTABLE(PERF_CCU_GMEM_READ, UINT64, AVERAGE),101COUNTABLE(PERF_CCU_GMEM_WRITE, UINT64, AVERAGE),102COUNTABLE(PERF_CCU_DEPTH_READ_FLAG0_COUNT, UINT64, AVERAGE),103COUNTABLE(PERF_CCU_DEPTH_READ_FLAG1_COUNT, UINT64, AVERAGE),104COUNTABLE(PERF_CCU_DEPTH_READ_FLAG2_COUNT, UINT64, AVERAGE),105COUNTABLE(PERF_CCU_DEPTH_READ_FLAG3_COUNT, UINT64, AVERAGE),106COUNTABLE(PERF_CCU_DEPTH_READ_FLAG4_COUNT, UINT64, AVERAGE),107COUNTABLE(PERF_CCU_COLOR_READ_FLAG0_COUNT, UINT64, AVERAGE),108COUNTABLE(PERF_CCU_COLOR_READ_FLAG1_COUNT, UINT64, AVERAGE),109COUNTABLE(PERF_CCU_COLOR_READ_FLAG2_COUNT, UINT64, AVERAGE),110COUNTABLE(PERF_CCU_COLOR_READ_FLAG3_COUNT, UINT64, AVERAGE),111COUNTABLE(PERF_CCU_COLOR_READ_FLAG4_COUNT, UINT64, AVERAGE),112COUNTABLE(PERF_CCU_2D_BUSY_CYCLES, UINT64, AVERAGE),113COUNTABLE(PERF_CCU_2D_RD_REQ, UINT64, AVERAGE),114COUNTABLE(PERF_CCU_2D_WR_REQ, UINT64, AVERAGE),115COUNTABLE(PERF_CCU_2D_REORDER_STARVE_CYCLES, UINT64, AVERAGE),116COUNTABLE(PERF_CCU_2D_PIXELS, UINT64, AVERAGE),117};118119static const struct fd_perfcntr_counter tse_counters[] = {120COUNTER(GRAS_PERFCTR_TSE_SEL_0, RBBM_PERFCTR_TSE_0_LO, RBBM_PERFCTR_TSE_0_HI),121COUNTER(GRAS_PERFCTR_TSE_SEL_1, RBBM_PERFCTR_TSE_1_LO, RBBM_PERFCTR_TSE_1_HI),122COUNTER(GRAS_PERFCTR_TSE_SEL_2, RBBM_PERFCTR_TSE_2_LO, RBBM_PERFCTR_TSE_2_HI),123COUNTER(GRAS_PERFCTR_TSE_SEL_3, RBBM_PERFCTR_TSE_3_LO, RBBM_PERFCTR_TSE_3_HI),124};125126static const struct fd_perfcntr_countable tse_countables[] = {127COUNTABLE(PERF_TSE_BUSY_CYCLES, UINT64, AVERAGE),128COUNTABLE(PERF_TSE_CLIPPING_CYCLES, UINT64, AVERAGE),129COUNTABLE(PERF_TSE_STALL_CYCLES_RAS, UINT64, AVERAGE),130COUNTABLE(PERF_TSE_STALL_CYCLES_LRZ_BARYPLANE, UINT64, AVERAGE),131COUNTABLE(PERF_TSE_STALL_CYCLES_LRZ_ZPLANE, UINT64, AVERAGE),132COUNTABLE(PERF_TSE_STARVE_CYCLES_PC, UINT64, AVERAGE),133COUNTABLE(PERF_TSE_INPUT_PRIM, UINT64, AVERAGE),134COUNTABLE(PERF_TSE_INPUT_NULL_PRIM, UINT64, AVERAGE),135COUNTABLE(PERF_TSE_TRIVAL_REJ_PRIM, UINT64, AVERAGE),136COUNTABLE(PERF_TSE_CLIPPED_PRIM, UINT64, AVERAGE),137COUNTABLE(PERF_TSE_ZERO_AREA_PRIM, UINT64, AVERAGE),138COUNTABLE(PERF_TSE_FACENESS_CULLED_PRIM, UINT64, AVERAGE),139COUNTABLE(PERF_TSE_ZERO_PIXEL_PRIM, UINT64, AVERAGE),140COUNTABLE(PERF_TSE_OUTPUT_NULL_PRIM, UINT64, AVERAGE),141COUNTABLE(PERF_TSE_OUTPUT_VISIBLE_PRIM, UINT64, AVERAGE),142COUNTABLE(PERF_TSE_CINVOCATION, UINT64, AVERAGE),143COUNTABLE(PERF_TSE_CPRIMITIVES, UINT64, AVERAGE),144COUNTABLE(PERF_TSE_2D_INPUT_PRIM, UINT64, AVERAGE),145COUNTABLE(PERF_TSE_2D_ALIVE_CLCLES, UINT64, AVERAGE),146};147148static const struct fd_perfcntr_counter ras_counters[] = {149COUNTER(GRAS_PERFCTR_RAS_SEL_0, RBBM_PERFCTR_RAS_0_LO, RBBM_PERFCTR_RAS_0_HI),150COUNTER(GRAS_PERFCTR_RAS_SEL_1, RBBM_PERFCTR_RAS_1_LO, RBBM_PERFCTR_RAS_1_HI),151COUNTER(GRAS_PERFCTR_RAS_SEL_2, RBBM_PERFCTR_RAS_2_LO, RBBM_PERFCTR_RAS_2_HI),152COUNTER(GRAS_PERFCTR_RAS_SEL_3, RBBM_PERFCTR_RAS_3_LO, RBBM_PERFCTR_RAS_3_HI),153};154155static const struct fd_perfcntr_countable ras_countables[] = {156COUNTABLE(PERF_RAS_BUSY_CYCLES, UINT64, AVERAGE),157COUNTABLE(PERF_RAS_SUPERTILE_ACTIVE_CYCLES, UINT64, AVERAGE),158COUNTABLE(PERF_RAS_STALL_CYCLES_LRZ, UINT64, AVERAGE),159COUNTABLE(PERF_RAS_STARVE_CYCLES_TSE, UINT64, AVERAGE),160COUNTABLE(PERF_RAS_SUPER_TILES, UINT64, AVERAGE),161COUNTABLE(PERF_RAS_8X4_TILES, UINT64, AVERAGE),162COUNTABLE(PERF_RAS_MASKGEN_ACTIVE, UINT64, AVERAGE),163COUNTABLE(PERF_RAS_FULLY_COVERED_SUPER_TILES, UINT64, AVERAGE),164COUNTABLE(PERF_RAS_FULLY_COVERED_8X4_TILES, UINT64, AVERAGE),165COUNTABLE(PERF_RAS_PRIM_KILLED_INVISILBE, UINT64, AVERAGE),166};167168static const struct fd_perfcntr_counter lrz_counters[] = {169COUNTER(GRAS_PERFCTR_LRZ_SEL_0, RBBM_PERFCTR_LRZ_0_LO, RBBM_PERFCTR_LRZ_0_HI),170COUNTER(GRAS_PERFCTR_LRZ_SEL_1, RBBM_PERFCTR_LRZ_1_LO, RBBM_PERFCTR_LRZ_1_HI),171COUNTER(GRAS_PERFCTR_LRZ_SEL_2, RBBM_PERFCTR_LRZ_2_LO, RBBM_PERFCTR_LRZ_2_HI),172COUNTER(GRAS_PERFCTR_LRZ_SEL_3, RBBM_PERFCTR_LRZ_3_LO, RBBM_PERFCTR_LRZ_3_HI),173};174175static const struct fd_perfcntr_countable lrz_countables[] = {176COUNTABLE(PERF_LRZ_BUSY_CYCLES, UINT64, AVERAGE),177COUNTABLE(PERF_LRZ_STARVE_CYCLES_RAS, UINT64, AVERAGE),178COUNTABLE(PERF_LRZ_STALL_CYCLES_RB, UINT64, AVERAGE),179COUNTABLE(PERF_LRZ_STALL_CYCLES_VSC, UINT64, AVERAGE),180COUNTABLE(PERF_LRZ_STALL_CYCLES_VPC, UINT64, AVERAGE),181COUNTABLE(PERF_LRZ_STALL_CYCLES_FLAG_PREFETCH, UINT64, AVERAGE),182COUNTABLE(PERF_LRZ_STALL_CYCLES_UCHE, UINT64, AVERAGE),183COUNTABLE(PERF_LRZ_LRZ_READ, UINT64, AVERAGE),184COUNTABLE(PERF_LRZ_LRZ_WRITE, UINT64, AVERAGE),185COUNTABLE(PERF_LRZ_READ_LATENCY, UINT64, AVERAGE),186COUNTABLE(PERF_LRZ_MERGE_CACHE_UPDATING, UINT64, AVERAGE),187COUNTABLE(PERF_LRZ_PRIM_KILLED_BY_MASKGEN, UINT64, AVERAGE),188COUNTABLE(PERF_LRZ_PRIM_KILLED_BY_LRZ, UINT64, AVERAGE),189COUNTABLE(PERF_LRZ_VISIBLE_PRIM_AFTER_LRZ, UINT64, AVERAGE),190COUNTABLE(PERF_LRZ_FULL_8X8_TILES, UINT64, AVERAGE),191COUNTABLE(PERF_LRZ_PARTIAL_8X8_TILES, UINT64, AVERAGE),192COUNTABLE(PERF_LRZ_TILE_KILLED, UINT64, AVERAGE),193COUNTABLE(PERF_LRZ_TOTAL_PIXEL, UINT64, AVERAGE),194COUNTABLE(PERF_LRZ_VISIBLE_PIXEL_AFTER_LRZ, UINT64, AVERAGE),195};196197static const struct fd_perfcntr_counter hlsq_counters[] = {198COUNTER(HLSQ_PERFCTR_HLSQ_SEL_0, RBBM_PERFCTR_HLSQ_0_LO, RBBM_PERFCTR_HLSQ_0_HI),199COUNTER(HLSQ_PERFCTR_HLSQ_SEL_1, RBBM_PERFCTR_HLSQ_1_LO, RBBM_PERFCTR_HLSQ_1_HI),200COUNTER(HLSQ_PERFCTR_HLSQ_SEL_2, RBBM_PERFCTR_HLSQ_2_LO, RBBM_PERFCTR_HLSQ_2_HI),201COUNTER(HLSQ_PERFCTR_HLSQ_SEL_3, RBBM_PERFCTR_HLSQ_3_LO, RBBM_PERFCTR_HLSQ_3_HI),202COUNTER(HLSQ_PERFCTR_HLSQ_SEL_4, RBBM_PERFCTR_HLSQ_4_LO, RBBM_PERFCTR_HLSQ_4_HI),203COUNTER(HLSQ_PERFCTR_HLSQ_SEL_5, RBBM_PERFCTR_HLSQ_5_LO, RBBM_PERFCTR_HLSQ_5_HI),204COUNTER(HLSQ_PERFCTR_HLSQ_SEL_6, RBBM_PERFCTR_HLSQ_6_LO, RBBM_PERFCTR_HLSQ_6_HI),205COUNTER(HLSQ_PERFCTR_HLSQ_SEL_7, RBBM_PERFCTR_HLSQ_7_LO, RBBM_PERFCTR_HLSQ_7_HI),206};207208static const struct fd_perfcntr_countable hlsq_countables[] = {209COUNTABLE(PERF_HLSQ_BUSY_CYCLES, UINT64, AVERAGE),210COUNTABLE(PERF_HLSQ_STALL_CYCLES_UCHE, UINT64, AVERAGE),211COUNTABLE(PERF_HLSQ_STALL_CYCLES_SP_STATE, UINT64, AVERAGE),212COUNTABLE(PERF_HLSQ_STALL_CYCLES_SP_FS_STAGE, UINT64, AVERAGE),213COUNTABLE(PERF_HLSQ_UCHE_LATENCY_CYCLES, UINT64, AVERAGE),214COUNTABLE(PERF_HLSQ_UCHE_LATENCY_COUNT, UINT64, AVERAGE),215COUNTABLE(PERF_HLSQ_FS_STAGE_32_WAVES, UINT64, AVERAGE),216COUNTABLE(PERF_HLSQ_FS_STAGE_64_WAVES, UINT64, AVERAGE),217COUNTABLE(PERF_HLSQ_QUADS, UINT64, AVERAGE),218COUNTABLE(PERF_HLSQ_SP_STATE_COPY_TRANS_FS_STAGE, UINT64, AVERAGE),219COUNTABLE(PERF_HLSQ_SP_STATE_COPY_TRANS_VS_STAGE, UINT64, AVERAGE),220COUNTABLE(PERF_HLSQ_TP_STATE_COPY_TRANS_FS_STAGE, UINT64, AVERAGE),221COUNTABLE(PERF_HLSQ_TP_STATE_COPY_TRANS_VS_STAGE, UINT64, AVERAGE),222COUNTABLE(PERF_HLSQ_CS_INVOCATIONS, UINT64, AVERAGE),223COUNTABLE(PERF_HLSQ_COMPUTE_DRAWCALLS, UINT64, AVERAGE),224};225226static const struct fd_perfcntr_counter pc_counters[] = {227COUNTER(PC_PERFCTR_PC_SEL_0, RBBM_PERFCTR_PC_0_LO, RBBM_PERFCTR_PC_0_HI),228COUNTER(PC_PERFCTR_PC_SEL_1, RBBM_PERFCTR_PC_1_LO, RBBM_PERFCTR_PC_1_HI),229COUNTER(PC_PERFCTR_PC_SEL_2, RBBM_PERFCTR_PC_2_LO, RBBM_PERFCTR_PC_2_HI),230COUNTER(PC_PERFCTR_PC_SEL_3, RBBM_PERFCTR_PC_3_LO, RBBM_PERFCTR_PC_3_HI),231COUNTER(PC_PERFCTR_PC_SEL_4, RBBM_PERFCTR_PC_4_LO, RBBM_PERFCTR_PC_4_HI),232COUNTER(PC_PERFCTR_PC_SEL_5, RBBM_PERFCTR_PC_5_LO, RBBM_PERFCTR_PC_5_HI),233COUNTER(PC_PERFCTR_PC_SEL_6, RBBM_PERFCTR_PC_6_LO, RBBM_PERFCTR_PC_6_HI),234COUNTER(PC_PERFCTR_PC_SEL_7, RBBM_PERFCTR_PC_7_LO, RBBM_PERFCTR_PC_7_HI),235};236237static const struct fd_perfcntr_countable pc_countables[] = {238COUNTABLE(PERF_PC_BUSY_CYCLES, UINT64, AVERAGE),239COUNTABLE(PERF_PC_WORKING_CYCLES, UINT64, AVERAGE),240COUNTABLE(PERF_PC_STALL_CYCLES_VFD, UINT64, AVERAGE),241COUNTABLE(PERF_PC_STALL_CYCLES_TSE, UINT64, AVERAGE),242COUNTABLE(PERF_PC_STALL_CYCLES_VPC, UINT64, AVERAGE),243COUNTABLE(PERF_PC_STALL_CYCLES_UCHE, UINT64, AVERAGE),244COUNTABLE(PERF_PC_STALL_CYCLES_TESS, UINT64, AVERAGE),245COUNTABLE(PERF_PC_STALL_CYCLES_TSE_ONLY, UINT64, AVERAGE),246COUNTABLE(PERF_PC_STALL_CYCLES_VPC_ONLY, UINT64, AVERAGE),247COUNTABLE(PERF_PC_PASS1_TF_STALL_CYCLES, UINT64, AVERAGE),248COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_INDEX, UINT64, AVERAGE),249COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_TESS_FACTOR, UINT64, AVERAGE),250COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_VIZ_STREAM, UINT64, AVERAGE),251COUNTABLE(PERF_PC_STARVE_CYCLES_FOR_POSITION, UINT64, AVERAGE),252COUNTABLE(PERF_PC_STARVE_CYCLES_DI, UINT64, AVERAGE),253COUNTABLE(PERF_PC_VIS_STREAMS_LOADED, UINT64, AVERAGE),254COUNTABLE(PERF_PC_INSTANCES, UINT64, AVERAGE),255COUNTABLE(PERF_PC_VPC_PRIMITIVES, UINT64, AVERAGE),256COUNTABLE(PERF_PC_DEAD_PRIM, UINT64, AVERAGE),257COUNTABLE(PERF_PC_LIVE_PRIM, UINT64, AVERAGE),258COUNTABLE(PERF_PC_VERTEX_HITS, UINT64, AVERAGE),259COUNTABLE(PERF_PC_IA_VERTICES, UINT64, AVERAGE),260COUNTABLE(PERF_PC_IA_PRIMITIVES, UINT64, AVERAGE),261COUNTABLE(PERF_PC_GS_PRIMITIVES, UINT64, AVERAGE),262COUNTABLE(PERF_PC_HS_INVOCATIONS, UINT64, AVERAGE),263COUNTABLE(PERF_PC_DS_INVOCATIONS, UINT64, AVERAGE),264COUNTABLE(PERF_PC_VS_INVOCATIONS, UINT64, AVERAGE),265COUNTABLE(PERF_PC_GS_INVOCATIONS, UINT64, AVERAGE),266COUNTABLE(PERF_PC_DS_PRIMITIVES, UINT64, AVERAGE),267COUNTABLE(PERF_PC_VPC_POS_DATA_TRANSACTION, UINT64, AVERAGE),268COUNTABLE(PERF_PC_3D_DRAWCALLS, UINT64, AVERAGE),269COUNTABLE(PERF_PC_2D_DRAWCALLS, UINT64, AVERAGE),270COUNTABLE(PERF_PC_NON_DRAWCALL_GLOBAL_EVENTS, UINT64, AVERAGE),271COUNTABLE(PERF_TESS_BUSY_CYCLES, UINT64, AVERAGE),272COUNTABLE(PERF_TESS_WORKING_CYCLES, UINT64, AVERAGE),273COUNTABLE(PERF_TESS_STALL_CYCLES_PC, UINT64, AVERAGE),274COUNTABLE(PERF_TESS_STARVE_CYCLES_PC, UINT64, AVERAGE),275};276277static const struct fd_perfcntr_counter rb_counters[] = {278COUNTER(RB_PERFCTR_RB_SEL_0, RBBM_PERFCTR_RB_0_LO, RBBM_PERFCTR_RB_0_HI),279COUNTER(RB_PERFCTR_RB_SEL_1, RBBM_PERFCTR_RB_1_LO, RBBM_PERFCTR_RB_1_HI),280COUNTER(RB_PERFCTR_RB_SEL_2, RBBM_PERFCTR_RB_2_LO, RBBM_PERFCTR_RB_2_HI),281COUNTER(RB_PERFCTR_RB_SEL_3, RBBM_PERFCTR_RB_3_LO, RBBM_PERFCTR_RB_3_HI),282COUNTER(RB_PERFCTR_RB_SEL_4, RBBM_PERFCTR_RB_4_LO, RBBM_PERFCTR_RB_4_HI),283COUNTER(RB_PERFCTR_RB_SEL_5, RBBM_PERFCTR_RB_5_LO, RBBM_PERFCTR_RB_5_HI),284COUNTER(RB_PERFCTR_RB_SEL_6, RBBM_PERFCTR_RB_6_LO, RBBM_PERFCTR_RB_6_HI),285COUNTER(RB_PERFCTR_RB_SEL_7, RBBM_PERFCTR_RB_7_LO, RBBM_PERFCTR_RB_7_HI),286};287288static const struct fd_perfcntr_countable rb_countables[] = {289COUNTABLE(PERF_RB_BUSY_CYCLES, UINT64, AVERAGE),290COUNTABLE(PERF_RB_STALL_CYCLES_CCU, UINT64, AVERAGE),291COUNTABLE(PERF_RB_STALL_CYCLES_HLSQ, UINT64, AVERAGE),292COUNTABLE(PERF_RB_STALL_CYCLES_FIFO0_FULL, UINT64, AVERAGE),293COUNTABLE(PERF_RB_STALL_CYCLES_FIFO1_FULL, UINT64, AVERAGE),294COUNTABLE(PERF_RB_STALL_CYCLES_FIFO2_FULL, UINT64, AVERAGE),295COUNTABLE(PERF_RB_STARVE_CYCLES_SP, UINT64, AVERAGE),296COUNTABLE(PERF_RB_STARVE_CYCLES_LRZ_TILE, UINT64, AVERAGE),297COUNTABLE(PERF_RB_STARVE_CYCLES_CCU, UINT64, AVERAGE),298COUNTABLE(PERF_RB_STARVE_CYCLES_Z_PLANE, UINT64, AVERAGE),299COUNTABLE(PERF_RB_STARVE_CYCLES_BARY_PLANE, UINT64, AVERAGE),300COUNTABLE(PERF_RB_Z_WORKLOAD, UINT64, AVERAGE),301COUNTABLE(PERF_RB_HLSQ_ACTIVE, UINT64, AVERAGE),302COUNTABLE(PERF_RB_Z_READ, UINT64, AVERAGE),303COUNTABLE(PERF_RB_Z_WRITE, UINT64, AVERAGE),304COUNTABLE(PERF_RB_C_READ, UINT64, AVERAGE),305COUNTABLE(PERF_RB_C_WRITE, UINT64, AVERAGE),306COUNTABLE(PERF_RB_TOTAL_PASS, UINT64, AVERAGE),307COUNTABLE(PERF_RB_Z_PASS, UINT64, AVERAGE),308COUNTABLE(PERF_RB_Z_FAIL, UINT64, AVERAGE),309COUNTABLE(PERF_RB_S_FAIL, UINT64, AVERAGE),310COUNTABLE(PERF_RB_BLENDED_FXP_COMPONENTS, UINT64, AVERAGE),311COUNTABLE(PERF_RB_BLENDED_FP16_COMPONENTS, UINT64, AVERAGE),312COUNTABLE(RB_RESERVED, UINT64, AVERAGE),313COUNTABLE(PERF_RB_2D_ALIVE_CYCLES, UINT64, AVERAGE),314COUNTABLE(PERF_RB_2D_STALL_CYCLES_A2D, UINT64, AVERAGE),315COUNTABLE(PERF_RB_2D_STARVE_CYCLES_SRC, UINT64, AVERAGE),316COUNTABLE(PERF_RB_2D_STARVE_CYCLES_SP, UINT64, AVERAGE),317COUNTABLE(PERF_RB_2D_STARVE_CYCLES_DST, UINT64, AVERAGE),318COUNTABLE(PERF_RB_2D_VALID_PIXELS, UINT64, AVERAGE),319};320321static const struct fd_perfcntr_counter rbbm_counters[] = {322//RESERVED: for kernel323// COUNTER(RBBM_PERFCTR_RBBM_SEL_0, RBBM_PERFCTR_RBBM_0_LO, RBBM_PERFCTR_RBBM_0_HI),324COUNTER(RBBM_PERFCTR_RBBM_SEL_1, RBBM_PERFCTR_RBBM_1_LO, RBBM_PERFCTR_RBBM_1_HI),325COUNTER(RBBM_PERFCTR_RBBM_SEL_2, RBBM_PERFCTR_RBBM_2_LO, RBBM_PERFCTR_RBBM_2_HI),326COUNTER(RBBM_PERFCTR_RBBM_SEL_3, RBBM_PERFCTR_RBBM_3_LO, RBBM_PERFCTR_RBBM_3_HI),327};328329static const struct fd_perfcntr_countable rbbm_countables[] = {330COUNTABLE(PERF_RBBM_ALWAYS_COUNT, UINT64, AVERAGE),331COUNTABLE(PERF_RBBM_ALWAYS_ON, UINT64, AVERAGE),332COUNTABLE(PERF_RBBM_TSE_BUSY, UINT64, AVERAGE),333COUNTABLE(PERF_RBBM_RAS_BUSY, UINT64, AVERAGE),334COUNTABLE(PERF_RBBM_PC_DCALL_BUSY, UINT64, AVERAGE),335COUNTABLE(PERF_RBBM_PC_VSD_BUSY, UINT64, AVERAGE),336COUNTABLE(PERF_RBBM_STATUS_MASKED, UINT64, AVERAGE),337COUNTABLE(PERF_RBBM_COM_BUSY, UINT64, AVERAGE),338COUNTABLE(PERF_RBBM_DCOM_BUSY, UINT64, AVERAGE),339COUNTABLE(PERF_RBBM_VBIF_BUSY, UINT64, AVERAGE),340COUNTABLE(PERF_RBBM_VSC_BUSY, UINT64, AVERAGE),341COUNTABLE(PERF_RBBM_TESS_BUSY, UINT64, AVERAGE),342COUNTABLE(PERF_RBBM_UCHE_BUSY, UINT64, AVERAGE),343COUNTABLE(PERF_RBBM_HLSQ_BUSY, UINT64, AVERAGE),344};345346static const struct fd_perfcntr_counter sp_counters[] = {347//RESERVED: for kernel348// COUNTER(SP_PERFCTR_SP_SEL_0, RBBM_PERFCTR_SP_0_LO, RBBM_PERFCTR_SP_0_HI),349COUNTER(SP_PERFCTR_SP_SEL_1, RBBM_PERFCTR_SP_1_LO, RBBM_PERFCTR_SP_1_HI),350COUNTER(SP_PERFCTR_SP_SEL_2, RBBM_PERFCTR_SP_2_LO, RBBM_PERFCTR_SP_2_HI),351COUNTER(SP_PERFCTR_SP_SEL_3, RBBM_PERFCTR_SP_3_LO, RBBM_PERFCTR_SP_3_HI),352COUNTER(SP_PERFCTR_SP_SEL_4, RBBM_PERFCTR_SP_4_LO, RBBM_PERFCTR_SP_4_HI),353COUNTER(SP_PERFCTR_SP_SEL_5, RBBM_PERFCTR_SP_5_LO, RBBM_PERFCTR_SP_5_HI),354COUNTER(SP_PERFCTR_SP_SEL_6, RBBM_PERFCTR_SP_6_LO, RBBM_PERFCTR_SP_6_HI),355COUNTER(SP_PERFCTR_SP_SEL_7, RBBM_PERFCTR_SP_7_LO, RBBM_PERFCTR_SP_7_HI),356COUNTER(SP_PERFCTR_SP_SEL_8, RBBM_PERFCTR_SP_8_LO, RBBM_PERFCTR_SP_8_HI),357COUNTER(SP_PERFCTR_SP_SEL_9, RBBM_PERFCTR_SP_9_LO, RBBM_PERFCTR_SP_9_HI),358COUNTER(SP_PERFCTR_SP_SEL_10, RBBM_PERFCTR_SP_10_LO, RBBM_PERFCTR_SP_10_HI),359COUNTER(SP_PERFCTR_SP_SEL_11, RBBM_PERFCTR_SP_11_LO, RBBM_PERFCTR_SP_11_HI),360};361362static const struct fd_perfcntr_countable sp_countables[] = {363COUNTABLE(PERF_SP_BUSY_CYCLES, UINT64, AVERAGE),364COUNTABLE(PERF_SP_ALU_WORKING_CYCLES, UINT64, AVERAGE),365COUNTABLE(PERF_SP_EFU_WORKING_CYCLES, UINT64, AVERAGE),366COUNTABLE(PERF_SP_STALL_CYCLES_VPC, UINT64, AVERAGE),367COUNTABLE(PERF_SP_STALL_CYCLES_TP, UINT64, AVERAGE),368COUNTABLE(PERF_SP_STALL_CYCLES_UCHE, UINT64, AVERAGE),369COUNTABLE(PERF_SP_STALL_CYCLES_RB, UINT64, AVERAGE),370COUNTABLE(PERF_SP_SCHEDULER_NON_WORKING, UINT64, AVERAGE),371COUNTABLE(PERF_SP_WAVE_CONTEXTS, UINT64, AVERAGE),372COUNTABLE(PERF_SP_WAVE_CONTEXT_CYCLES, UINT64, AVERAGE),373COUNTABLE(PERF_SP_FS_STAGE_WAVE_CYCLES, UINT64, AVERAGE),374COUNTABLE(PERF_SP_FS_STAGE_WAVE_SAMPLES, UINT64, AVERAGE),375COUNTABLE(PERF_SP_VS_STAGE_WAVE_CYCLES, UINT64, AVERAGE),376COUNTABLE(PERF_SP_VS_STAGE_WAVE_SAMPLES, UINT64, AVERAGE),377COUNTABLE(PERF_SP_FS_STAGE_DURATION_CYCLES, UINT64, AVERAGE),378COUNTABLE(PERF_SP_VS_STAGE_DURATION_CYCLES, UINT64, AVERAGE),379COUNTABLE(PERF_SP_WAVE_CTRL_CYCLES, UINT64, AVERAGE),380COUNTABLE(PERF_SP_WAVE_LOAD_CYCLES, UINT64, AVERAGE),381COUNTABLE(PERF_SP_WAVE_EMIT_CYCLES, UINT64, AVERAGE),382COUNTABLE(PERF_SP_WAVE_NOP_CYCLES, UINT64, AVERAGE),383COUNTABLE(PERF_SP_WAVE_WAIT_CYCLES, UINT64, AVERAGE),384COUNTABLE(PERF_SP_WAVE_FETCH_CYCLES, UINT64, AVERAGE),385COUNTABLE(PERF_SP_WAVE_IDLE_CYCLES, UINT64, AVERAGE),386COUNTABLE(PERF_SP_WAVE_END_CYCLES, UINT64, AVERAGE),387COUNTABLE(PERF_SP_WAVE_LONG_SYNC_CYCLES, UINT64, AVERAGE),388COUNTABLE(PERF_SP_WAVE_SHORT_SYNC_CYCLES, UINT64, AVERAGE),389COUNTABLE(PERF_SP_WAVE_JOIN_CYCLES, UINT64, AVERAGE),390COUNTABLE(PERF_SP_LM_LOAD_INSTRUCTIONS, UINT64, AVERAGE),391COUNTABLE(PERF_SP_LM_STORE_INSTRUCTIONS, UINT64, AVERAGE),392COUNTABLE(PERF_SP_LM_ATOMICS, UINT64, AVERAGE),393COUNTABLE(PERF_SP_GM_LOAD_INSTRUCTIONS, UINT64, AVERAGE),394COUNTABLE(PERF_SP_GM_STORE_INSTRUCTIONS, UINT64, AVERAGE),395COUNTABLE(PERF_SP_GM_ATOMICS, UINT64, AVERAGE),396COUNTABLE(PERF_SP_VS_STAGE_TEX_INSTRUCTIONS, UINT64, AVERAGE),397COUNTABLE(PERF_SP_VS_STAGE_CFLOW_INSTRUCTIONS, UINT64, AVERAGE),398COUNTABLE(PERF_SP_VS_STAGE_EFU_INSTRUCTIONS, UINT64, AVERAGE),399COUNTABLE(PERF_SP_VS_STAGE_FULL_ALU_INSTRUCTIONS, UINT64, AVERAGE),400COUNTABLE(PERF_SP_VS_STAGE_HALF_ALU_INSTRUCTIONS, UINT64, AVERAGE),401COUNTABLE(PERF_SP_FS_STAGE_TEX_INSTRUCTIONS, UINT64, AVERAGE),402COUNTABLE(PERF_SP_FS_STAGE_CFLOW_INSTRUCTIONS, UINT64, AVERAGE),403COUNTABLE(PERF_SP_FS_STAGE_EFU_INSTRUCTIONS, UINT64, AVERAGE),404COUNTABLE(PERF_SP_FS_STAGE_FULL_ALU_INSTRUCTIONS, UINT64, AVERAGE),405COUNTABLE(PERF_SP_FS_STAGE_HALF_ALU_INSTRUCTIONS, UINT64, AVERAGE),406COUNTABLE(PERF_SP_FS_STAGE_BARY_INSTRUCTIONS, UINT64, AVERAGE),407COUNTABLE(PERF_SP_VS_INSTRUCTIONS, UINT64, AVERAGE),408COUNTABLE(PERF_SP_FS_INSTRUCTIONS, UINT64, AVERAGE),409COUNTABLE(PERF_SP_ADDR_LOCK_COUNT, UINT64, AVERAGE),410COUNTABLE(PERF_SP_UCHE_READ_TRANS, UINT64, AVERAGE),411COUNTABLE(PERF_SP_UCHE_WRITE_TRANS, UINT64, AVERAGE),412COUNTABLE(PERF_SP_EXPORT_VPC_TRANS, UINT64, AVERAGE),413COUNTABLE(PERF_SP_EXPORT_RB_TRANS, UINT64, AVERAGE),414COUNTABLE(PERF_SP_PIXELS_KILLED, UINT64, AVERAGE),415COUNTABLE(PERF_SP_ICL1_REQUESTS, UINT64, AVERAGE),416COUNTABLE(PERF_SP_ICL1_MISSES, UINT64, AVERAGE),417COUNTABLE(PERF_SP_ICL0_REQUESTS, UINT64, AVERAGE),418COUNTABLE(PERF_SP_ICL0_MISSES, UINT64, AVERAGE),419COUNTABLE(PERF_SP_HS_INSTRUCTIONS, UINT64, AVERAGE),420COUNTABLE(PERF_SP_DS_INSTRUCTIONS, UINT64, AVERAGE),421COUNTABLE(PERF_SP_GS_INSTRUCTIONS, UINT64, AVERAGE),422COUNTABLE(PERF_SP_CS_INSTRUCTIONS, UINT64, AVERAGE),423COUNTABLE(PERF_SP_GPR_READ, UINT64, AVERAGE),424COUNTABLE(PERF_SP_GPR_WRITE, UINT64, AVERAGE),425COUNTABLE(PERF_SP_LM_CH0_REQUESTS, UINT64, AVERAGE),426COUNTABLE(PERF_SP_LM_CH1_REQUESTS, UINT64, AVERAGE),427COUNTABLE(PERF_SP_LM_BANK_CONFLICTS, UINT64, AVERAGE),428};429430static const struct fd_perfcntr_counter tp_counters[] = {431COUNTER(TPL1_PERFCTR_TP_SEL_0, RBBM_PERFCTR_TP_0_LO, RBBM_PERFCTR_TP_0_HI),432COUNTER(TPL1_PERFCTR_TP_SEL_1, RBBM_PERFCTR_TP_1_LO, RBBM_PERFCTR_TP_1_HI),433COUNTER(TPL1_PERFCTR_TP_SEL_2, RBBM_PERFCTR_TP_2_LO, RBBM_PERFCTR_TP_2_HI),434COUNTER(TPL1_PERFCTR_TP_SEL_3, RBBM_PERFCTR_TP_3_LO, RBBM_PERFCTR_TP_3_HI),435COUNTER(TPL1_PERFCTR_TP_SEL_4, RBBM_PERFCTR_TP_4_LO, RBBM_PERFCTR_TP_4_HI),436COUNTER(TPL1_PERFCTR_TP_SEL_5, RBBM_PERFCTR_TP_5_LO, RBBM_PERFCTR_TP_5_HI),437COUNTER(TPL1_PERFCTR_TP_SEL_6, RBBM_PERFCTR_TP_6_LO, RBBM_PERFCTR_TP_6_HI),438COUNTER(TPL1_PERFCTR_TP_SEL_7, RBBM_PERFCTR_TP_7_LO, RBBM_PERFCTR_TP_7_HI),439};440441static const struct fd_perfcntr_countable tp_countables[] = {442COUNTABLE(PERF_TP_BUSY_CYCLES, UINT64, AVERAGE),443COUNTABLE(PERF_TP_STALL_CYCLES_UCHE, UINT64, AVERAGE),444COUNTABLE(PERF_TP_LATENCY_CYCLES, UINT64, AVERAGE),445COUNTABLE(PERF_TP_LATENCY_TRANS, UINT64, AVERAGE),446COUNTABLE(PERF_TP_FLAG_CACHE_REQUEST_SAMPLES, UINT64, AVERAGE),447COUNTABLE(PERF_TP_FLAG_CACHE_REQUEST_LATENCY, UINT64, AVERAGE),448COUNTABLE(PERF_TP_L1_CACHELINE_REQUESTS, UINT64, AVERAGE),449COUNTABLE(PERF_TP_L1_CACHELINE_MISSES, UINT64, AVERAGE),450COUNTABLE(PERF_TP_SP_TP_TRANS, UINT64, AVERAGE),451COUNTABLE(PERF_TP_TP_SP_TRANS, UINT64, AVERAGE),452COUNTABLE(PERF_TP_OUTPUT_PIXELS, UINT64, AVERAGE),453COUNTABLE(PERF_TP_FILTER_WORKLOAD_16BIT, UINT64, AVERAGE),454COUNTABLE(PERF_TP_FILTER_WORKLOAD_32BIT, UINT64, AVERAGE),455COUNTABLE(PERF_TP_QUADS_RECEIVED, UINT64, AVERAGE),456COUNTABLE(PERF_TP_QUADS_OFFSET, UINT64, AVERAGE),457COUNTABLE(PERF_TP_QUADS_SHADOW, UINT64, AVERAGE),458COUNTABLE(PERF_TP_QUADS_ARRAY, UINT64, AVERAGE),459COUNTABLE(PERF_TP_QUADS_GRADIENT, UINT64, AVERAGE),460COUNTABLE(PERF_TP_QUADS_1D, UINT64, AVERAGE),461COUNTABLE(PERF_TP_QUADS_2D, UINT64, AVERAGE),462COUNTABLE(PERF_TP_QUADS_BUFFER, UINT64, AVERAGE),463COUNTABLE(PERF_TP_QUADS_3D, UINT64, AVERAGE),464COUNTABLE(PERF_TP_QUADS_CUBE, UINT64, AVERAGE),465COUNTABLE(PERF_TP_STATE_CACHE_REQUESTS, UINT64, AVERAGE),466COUNTABLE(PERF_TP_STATE_CACHE_MISSES, UINT64, AVERAGE),467COUNTABLE(PERF_TP_DIVERGENT_QUADS_RECEIVED, UINT64, AVERAGE),468COUNTABLE(PERF_TP_BINDLESS_STATE_CACHE_REQUESTS, UINT64, AVERAGE),469COUNTABLE(PERF_TP_BINDLESS_STATE_CACHE_MISSES, UINT64, AVERAGE),470COUNTABLE(PERF_TP_PRT_NON_RESIDENT_EVENTS, UINT64, AVERAGE),471COUNTABLE(PERF_TP_OUTPUT_PIXELS_POINT, UINT64, AVERAGE),472COUNTABLE(PERF_TP_OUTPUT_PIXELS_BILINEAR, UINT64, AVERAGE),473COUNTABLE(PERF_TP_OUTPUT_PIXELS_MIP, UINT64, AVERAGE),474COUNTABLE(PERF_TP_OUTPUT_PIXELS_ANISO, UINT64, AVERAGE),475COUNTABLE(PERF_TP_OUTPUT_PIXELS_ZERO_LOD, UINT64, AVERAGE),476COUNTABLE(PERF_TP_FLAG_CACHE_REQUESTS, UINT64, AVERAGE),477COUNTABLE(PERF_TP_FLAG_CACHE_MISSES, UINT64, AVERAGE),478COUNTABLE(PERF_TP_L1_5_L2_REQUESTS, UINT64, AVERAGE),479COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS, UINT64, AVERAGE),480COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS_POINT, UINT64, AVERAGE),481COUNTABLE(PERF_TP_2D_OUTPUT_PIXELS_BILINEAR, UINT64, AVERAGE),482COUNTABLE(PERF_TP_2D_FILTER_WORKLOAD_16BIT, UINT64, AVERAGE),483COUNTABLE(PERF_TP_2D_FILTER_WORKLOAD_32BIT, UINT64, AVERAGE),484};485486static const struct fd_perfcntr_counter uche_counters[] = {487COUNTER(UCHE_PERFCTR_UCHE_SEL_0, RBBM_PERFCTR_UCHE_0_LO, RBBM_PERFCTR_UCHE_0_HI),488COUNTER(UCHE_PERFCTR_UCHE_SEL_1, RBBM_PERFCTR_UCHE_1_LO, RBBM_PERFCTR_UCHE_1_HI),489COUNTER(UCHE_PERFCTR_UCHE_SEL_2, RBBM_PERFCTR_UCHE_2_LO, RBBM_PERFCTR_UCHE_2_HI),490COUNTER(UCHE_PERFCTR_UCHE_SEL_3, RBBM_PERFCTR_UCHE_3_LO, RBBM_PERFCTR_UCHE_3_HI),491COUNTER(UCHE_PERFCTR_UCHE_SEL_4, RBBM_PERFCTR_UCHE_4_LO, RBBM_PERFCTR_UCHE_4_HI),492COUNTER(UCHE_PERFCTR_UCHE_SEL_5, RBBM_PERFCTR_UCHE_5_LO, RBBM_PERFCTR_UCHE_5_HI),493COUNTER(UCHE_PERFCTR_UCHE_SEL_6, RBBM_PERFCTR_UCHE_6_LO, RBBM_PERFCTR_UCHE_6_HI),494COUNTER(UCHE_PERFCTR_UCHE_SEL_7, RBBM_PERFCTR_UCHE_7_LO, RBBM_PERFCTR_UCHE_7_HI),495};496497static const struct fd_perfcntr_countable uche_countables[] = {498COUNTABLE(PERF_UCHE_BUSY_CYCLES, UINT64, AVERAGE),499COUNTABLE(PERF_UCHE_STALL_CYCLES_VBIF, UINT64, AVERAGE),500COUNTABLE(PERF_UCHE_VBIF_LATENCY_CYCLES, UINT64, AVERAGE),501COUNTABLE(PERF_UCHE_VBIF_LATENCY_SAMPLES, UINT64, AVERAGE),502COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_TP, UINT64, AVERAGE),503COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_VFD, UINT64, AVERAGE),504COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_HLSQ, UINT64, AVERAGE),505COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_LRZ, UINT64, AVERAGE),506COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_SP, UINT64, AVERAGE),507COUNTABLE(PERF_UCHE_READ_REQUESTS_TP, UINT64, AVERAGE),508COUNTABLE(PERF_UCHE_READ_REQUESTS_VFD, UINT64, AVERAGE),509COUNTABLE(PERF_UCHE_READ_REQUESTS_HLSQ, UINT64, AVERAGE),510COUNTABLE(PERF_UCHE_READ_REQUESTS_LRZ, UINT64, AVERAGE),511COUNTABLE(PERF_UCHE_READ_REQUESTS_SP, UINT64, AVERAGE),512COUNTABLE(PERF_UCHE_WRITE_REQUESTS_LRZ, UINT64, AVERAGE),513COUNTABLE(PERF_UCHE_WRITE_REQUESTS_SP, UINT64, AVERAGE),514COUNTABLE(PERF_UCHE_WRITE_REQUESTS_VPC, UINT64, AVERAGE),515COUNTABLE(PERF_UCHE_WRITE_REQUESTS_VSC, UINT64, AVERAGE),516COUNTABLE(PERF_UCHE_EVICTS, UINT64, AVERAGE),517COUNTABLE(PERF_UCHE_BANK_REQ0, UINT64, AVERAGE),518COUNTABLE(PERF_UCHE_BANK_REQ1, UINT64, AVERAGE),519COUNTABLE(PERF_UCHE_BANK_REQ2, UINT64, AVERAGE),520COUNTABLE(PERF_UCHE_BANK_REQ3, UINT64, AVERAGE),521COUNTABLE(PERF_UCHE_BANK_REQ4, UINT64, AVERAGE),522COUNTABLE(PERF_UCHE_BANK_REQ5, UINT64, AVERAGE),523COUNTABLE(PERF_UCHE_BANK_REQ6, UINT64, AVERAGE),524COUNTABLE(PERF_UCHE_BANK_REQ7, UINT64, AVERAGE),525COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_CH0, UINT64, AVERAGE),526COUNTABLE(PERF_UCHE_VBIF_READ_BEATS_CH1, UINT64, AVERAGE),527COUNTABLE(PERF_UCHE_GMEM_READ_BEATS, UINT64, AVERAGE),528COUNTABLE(PERF_UCHE_FLAG_COUNT, UINT64, AVERAGE),529};530531static const struct fd_perfcntr_counter vfd_counters[] = {532COUNTER(VFD_PERFCTR_VFD_SEL_0, RBBM_PERFCTR_VFD_0_LO, RBBM_PERFCTR_VFD_0_HI),533COUNTER(VFD_PERFCTR_VFD_SEL_1, RBBM_PERFCTR_VFD_1_LO, RBBM_PERFCTR_VFD_1_HI),534COUNTER(VFD_PERFCTR_VFD_SEL_2, RBBM_PERFCTR_VFD_2_LO, RBBM_PERFCTR_VFD_2_HI),535COUNTER(VFD_PERFCTR_VFD_SEL_3, RBBM_PERFCTR_VFD_3_LO, RBBM_PERFCTR_VFD_3_HI),536COUNTER(VFD_PERFCTR_VFD_SEL_4, RBBM_PERFCTR_VFD_4_LO, RBBM_PERFCTR_VFD_4_HI),537COUNTER(VFD_PERFCTR_VFD_SEL_5, RBBM_PERFCTR_VFD_5_LO, RBBM_PERFCTR_VFD_5_HI),538COUNTER(VFD_PERFCTR_VFD_SEL_6, RBBM_PERFCTR_VFD_6_LO, RBBM_PERFCTR_VFD_6_HI),539COUNTER(VFD_PERFCTR_VFD_SEL_7, RBBM_PERFCTR_VFD_7_LO, RBBM_PERFCTR_VFD_7_HI),540};541542static const struct fd_perfcntr_countable vfd_countables[] = {543COUNTABLE(PERF_VFD_BUSY_CYCLES, UINT64, AVERAGE),544COUNTABLE(PERF_VFD_STALL_CYCLES_UCHE, UINT64, AVERAGE),545COUNTABLE(PERF_VFD_STALL_CYCLES_VPC_ALLOC, UINT64, AVERAGE),546COUNTABLE(PERF_VFD_STALL_CYCLES_MISS_VB, UINT64, AVERAGE),547COUNTABLE(PERF_VFD_STALL_CYCLES_MISS_Q, UINT64, AVERAGE),548COUNTABLE(PERF_VFD_STALL_CYCLES_SP_INFO, UINT64, AVERAGE),549COUNTABLE(PERF_VFD_STALL_CYCLES_SP_ATTR, UINT64, AVERAGE),550COUNTABLE(PERF_VFD_STALL_CYCLES_VFDP_VB, UINT64, AVERAGE),551COUNTABLE(PERF_VFD_STALL_CYCLES_VFDP_Q, UINT64, AVERAGE),552COUNTABLE(PERF_VFD_DECODER_PACKER_STALL, UINT64, AVERAGE),553COUNTABLE(PERF_VFD_STARVE_CYCLES_UCHE, UINT64, AVERAGE),554COUNTABLE(PERF_VFD_RBUFFER_FULL, UINT64, AVERAGE),555COUNTABLE(PERF_VFD_ATTR_INFO_FIFO_FULL, UINT64, AVERAGE),556COUNTABLE(PERF_VFD_DECODED_ATTRIBUTE_BYTES, UINT64, AVERAGE),557COUNTABLE(PERF_VFD_NUM_ATTRIBUTES, UINT64, AVERAGE),558COUNTABLE(PERF_VFD_INSTRUCTIONS, UINT64, AVERAGE),559COUNTABLE(PERF_VFD_UPPER_SHADER_FIBERS, UINT64, AVERAGE),560COUNTABLE(PERF_VFD_LOWER_SHADER_FIBERS, UINT64, AVERAGE),561COUNTABLE(PERF_VFD_MODE_0_FIBERS, UINT64, AVERAGE),562COUNTABLE(PERF_VFD_MODE_1_FIBERS, UINT64, AVERAGE),563COUNTABLE(PERF_VFD_MODE_2_FIBERS, UINT64, AVERAGE),564COUNTABLE(PERF_VFD_MODE_3_FIBERS, UINT64, AVERAGE),565COUNTABLE(PERF_VFD_MODE_4_FIBERS, UINT64, AVERAGE),566COUNTABLE(PERF_VFD_TOTAL_VERTICES, UINT64, AVERAGE),567COUNTABLE(PERF_VFD_NUM_ATTR_MISS, UINT64, AVERAGE),568COUNTABLE(PERF_VFD_1_BURST_REQ, UINT64, AVERAGE),569COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD, UINT64, AVERAGE),570COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD_INDEX, UINT64, AVERAGE),571COUNTABLE(PERF_VFDP_STALL_CYCLES_VFD_PROG, UINT64, AVERAGE),572COUNTABLE(PERF_VFDP_STARVE_CYCLES_PC, UINT64, AVERAGE),573COUNTABLE(PERF_VFDP_VS_STAGE_32_WAVES, UINT64, AVERAGE),574};575576static const struct fd_perfcntr_counter vpc_counters[] = {577COUNTER(VPC_PERFCTR_VPC_SEL_0, RBBM_PERFCTR_VPC_0_LO, RBBM_PERFCTR_VPC_0_HI),578COUNTER(VPC_PERFCTR_VPC_SEL_1, RBBM_PERFCTR_VPC_1_LO, RBBM_PERFCTR_VPC_1_HI),579COUNTER(VPC_PERFCTR_VPC_SEL_2, RBBM_PERFCTR_VPC_2_LO, RBBM_PERFCTR_VPC_2_HI),580COUNTER(VPC_PERFCTR_VPC_SEL_3, RBBM_PERFCTR_VPC_3_LO, RBBM_PERFCTR_VPC_3_HI),581};582583static const struct fd_perfcntr_countable vpc_countables[] = {584COUNTABLE(PERF_VPC_BUSY_CYCLES, UINT64, AVERAGE),585COUNTABLE(PERF_VPC_WORKING_CYCLES, UINT64, AVERAGE),586COUNTABLE(PERF_VPC_STALL_CYCLES_UCHE, UINT64, AVERAGE),587COUNTABLE(PERF_VPC_STALL_CYCLES_VFD_WACK, UINT64, AVERAGE),588COUNTABLE(PERF_VPC_STALL_CYCLES_HLSQ_PRIM_ALLOC, UINT64, AVERAGE),589COUNTABLE(PERF_VPC_STALL_CYCLES_PC, UINT64, AVERAGE),590COUNTABLE(PERF_VPC_STALL_CYCLES_SP_LM, UINT64, AVERAGE),591COUNTABLE(PERF_VPC_POS_EXPORT_STALL_CYCLES, UINT64, AVERAGE),592COUNTABLE(PERF_VPC_STARVE_CYCLES_SP, UINT64, AVERAGE),593COUNTABLE(PERF_VPC_STARVE_CYCLES_LRZ, UINT64, AVERAGE),594COUNTABLE(PERF_VPC_PC_PRIMITIVES, UINT64, AVERAGE),595COUNTABLE(PERF_VPC_SP_COMPONENTS, UINT64, AVERAGE),596COUNTABLE(PERF_VPC_SP_LM_PRIMITIVES, UINT64, AVERAGE),597COUNTABLE(PERF_VPC_SP_LM_COMPONENTS, UINT64, AVERAGE),598COUNTABLE(PERF_VPC_SP_LM_DWORDS, UINT64, AVERAGE),599COUNTABLE(PERF_VPC_STREAMOUT_COMPONENTS, UINT64, AVERAGE),600COUNTABLE(PERF_VPC_GRANT_PHASES, UINT64, AVERAGE),601};602603static const struct fd_perfcntr_counter vsc_counters[] = {604COUNTER(VSC_PERFCTR_VSC_SEL_0, RBBM_PERFCTR_VSC_0_LO, RBBM_PERFCTR_VSC_0_HI),605COUNTER(VSC_PERFCTR_VSC_SEL_1, RBBM_PERFCTR_VSC_1_LO, RBBM_PERFCTR_VSC_1_HI),606};607608static const struct fd_perfcntr_countable vsc_countables[] = {609COUNTABLE(PERF_VSC_BUSY_CYCLES, UINT64, AVERAGE),610COUNTABLE(PERF_VSC_WORKING_CYCLES, UINT64, AVERAGE),611COUNTABLE(PERF_VSC_STALL_CYCLES_UCHE, UINT64, AVERAGE),612COUNTABLE(PERF_VSC_EOT_NUM, UINT64, AVERAGE),613};614615/* VBIF counters probably not too userful for userspace, and they make616* frameretrace take many more passes to collect all the metrics, so617* for now let's hide them.618*/619#if 0620/* VBIF counters break the pattern a bit, with enable and clear regs: */621static const struct fd_perfcntr_counter vbif_counters[] = {622COUNTER2(VBIF_PERF_CNT_SEL0, VBIF_PERF_CNT_LOW0, VBIF_PERF_CNT_HIGH0, VBIF_PERF_CNT_EN0, VBIF_PERF_CNT_CLR0),623COUNTER2(VBIF_PERF_CNT_SEL1, VBIF_PERF_CNT_LOW1, VBIF_PERF_CNT_HIGH1, VBIF_PERF_CNT_EN1, VBIF_PERF_CNT_CLR1),624COUNTER2(VBIF_PERF_CNT_SEL2, VBIF_PERF_CNT_LOW2, VBIF_PERF_CNT_HIGH2, VBIF_PERF_CNT_EN2, VBIF_PERF_CNT_CLR2),625COUNTER2(VBIF_PERF_CNT_SEL3, VBIF_PERF_CNT_LOW3, VBIF_PERF_CNT_HIGH3, VBIF_PERF_CNT_EN3, VBIF_PERF_CNT_CLR3),626};627628static const struct fd_perfcntr_countable vbif_countables[] = {629COUNTABLE(AXI_READ_REQUESTS_ID_0, UINT64, AVERAGE),630COUNTABLE(AXI_READ_REQUESTS_ID_1, UINT64, AVERAGE),631COUNTABLE(AXI_READ_REQUESTS_ID_2, UINT64, AVERAGE),632COUNTABLE(AXI_READ_REQUESTS_ID_3, UINT64, AVERAGE),633COUNTABLE(AXI_READ_REQUESTS_ID_4, UINT64, AVERAGE),634COUNTABLE(AXI_READ_REQUESTS_ID_5, UINT64, AVERAGE),635COUNTABLE(AXI_READ_REQUESTS_ID_6, UINT64, AVERAGE),636COUNTABLE(AXI_READ_REQUESTS_ID_7, UINT64, AVERAGE),637COUNTABLE(AXI_READ_REQUESTS_ID_8, UINT64, AVERAGE),638COUNTABLE(AXI_READ_REQUESTS_ID_9, UINT64, AVERAGE),639COUNTABLE(AXI_READ_REQUESTS_ID_10, UINT64, AVERAGE),640COUNTABLE(AXI_READ_REQUESTS_ID_11, UINT64, AVERAGE),641COUNTABLE(AXI_READ_REQUESTS_ID_12, UINT64, AVERAGE),642COUNTABLE(AXI_READ_REQUESTS_ID_13, UINT64, AVERAGE),643COUNTABLE(AXI_READ_REQUESTS_ID_14, UINT64, AVERAGE),644COUNTABLE(AXI_READ_REQUESTS_ID_15, UINT64, AVERAGE),645COUNTABLE(AXI0_READ_REQUESTS_TOTAL, UINT64, AVERAGE),646COUNTABLE(AXI1_READ_REQUESTS_TOTAL, UINT64, AVERAGE),647COUNTABLE(AXI2_READ_REQUESTS_TOTAL, UINT64, AVERAGE),648COUNTABLE(AXI3_READ_REQUESTS_TOTAL, UINT64, AVERAGE),649COUNTABLE(AXI_READ_REQUESTS_TOTAL, UINT64, AVERAGE),650COUNTABLE(AXI_WRITE_REQUESTS_ID_0, UINT64, AVERAGE),651COUNTABLE(AXI_WRITE_REQUESTS_ID_1, UINT64, AVERAGE),652COUNTABLE(AXI_WRITE_REQUESTS_ID_2, UINT64, AVERAGE),653COUNTABLE(AXI_WRITE_REQUESTS_ID_3, UINT64, AVERAGE),654COUNTABLE(AXI_WRITE_REQUESTS_ID_4, UINT64, AVERAGE),655COUNTABLE(AXI_WRITE_REQUESTS_ID_5, UINT64, AVERAGE),656COUNTABLE(AXI_WRITE_REQUESTS_ID_6, UINT64, AVERAGE),657COUNTABLE(AXI_WRITE_REQUESTS_ID_7, UINT64, AVERAGE),658COUNTABLE(AXI_WRITE_REQUESTS_ID_8, UINT64, AVERAGE),659COUNTABLE(AXI_WRITE_REQUESTS_ID_9, UINT64, AVERAGE),660COUNTABLE(AXI_WRITE_REQUESTS_ID_10, UINT64, AVERAGE),661COUNTABLE(AXI_WRITE_REQUESTS_ID_11, UINT64, AVERAGE),662COUNTABLE(AXI_WRITE_REQUESTS_ID_12, UINT64, AVERAGE),663COUNTABLE(AXI_WRITE_REQUESTS_ID_13, UINT64, AVERAGE),664COUNTABLE(AXI_WRITE_REQUESTS_ID_14, UINT64, AVERAGE),665COUNTABLE(AXI_WRITE_REQUESTS_ID_15, UINT64, AVERAGE),666COUNTABLE(AXI0_WRITE_REQUESTS_TOTAL, UINT64, AVERAGE),667COUNTABLE(AXI1_WRITE_REQUESTS_TOTAL, UINT64, AVERAGE),668COUNTABLE(AXI2_WRITE_REQUESTS_TOTAL, UINT64, AVERAGE),669COUNTABLE(AXI3_WRITE_REQUESTS_TOTAL, UINT64, AVERAGE),670COUNTABLE(AXI_WRITE_REQUESTS_TOTAL, UINT64, AVERAGE),671COUNTABLE(AXI_TOTAL_REQUESTS, UINT64, AVERAGE),672COUNTABLE(AXI_READ_DATA_BEATS_ID_0, UINT64, AVERAGE),673COUNTABLE(AXI_READ_DATA_BEATS_ID_1, UINT64, AVERAGE),674COUNTABLE(AXI_READ_DATA_BEATS_ID_2, UINT64, AVERAGE),675COUNTABLE(AXI_READ_DATA_BEATS_ID_3, UINT64, AVERAGE),676COUNTABLE(AXI_READ_DATA_BEATS_ID_4, UINT64, AVERAGE),677COUNTABLE(AXI_READ_DATA_BEATS_ID_5, UINT64, AVERAGE),678COUNTABLE(AXI_READ_DATA_BEATS_ID_6, UINT64, AVERAGE),679COUNTABLE(AXI_READ_DATA_BEATS_ID_7, UINT64, AVERAGE),680COUNTABLE(AXI_READ_DATA_BEATS_ID_8, UINT64, AVERAGE),681COUNTABLE(AXI_READ_DATA_BEATS_ID_9, UINT64, AVERAGE),682COUNTABLE(AXI_READ_DATA_BEATS_ID_10, UINT64, AVERAGE),683COUNTABLE(AXI_READ_DATA_BEATS_ID_11, UINT64, AVERAGE),684COUNTABLE(AXI_READ_DATA_BEATS_ID_12, UINT64, AVERAGE),685COUNTABLE(AXI_READ_DATA_BEATS_ID_13, UINT64, AVERAGE),686COUNTABLE(AXI_READ_DATA_BEATS_ID_14, UINT64, AVERAGE),687COUNTABLE(AXI_READ_DATA_BEATS_ID_15, UINT64, AVERAGE),688COUNTABLE(AXI0_READ_DATA_BEATS_TOTAL, UINT64, AVERAGE),689COUNTABLE(AXI1_READ_DATA_BEATS_TOTAL, UINT64, AVERAGE),690COUNTABLE(AXI2_READ_DATA_BEATS_TOTAL, UINT64, AVERAGE),691COUNTABLE(AXI3_READ_DATA_BEATS_TOTAL, UINT64, AVERAGE),692COUNTABLE(AXI_READ_DATA_BEATS_TOTAL, UINT64, AVERAGE),693COUNTABLE(AXI_WRITE_DATA_BEATS_ID_0, UINT64, AVERAGE),694COUNTABLE(AXI_WRITE_DATA_BEATS_ID_1, UINT64, AVERAGE),695COUNTABLE(AXI_WRITE_DATA_BEATS_ID_2, UINT64, AVERAGE),696COUNTABLE(AXI_WRITE_DATA_BEATS_ID_3, UINT64, AVERAGE),697COUNTABLE(AXI_WRITE_DATA_BEATS_ID_4, UINT64, AVERAGE),698COUNTABLE(AXI_WRITE_DATA_BEATS_ID_5, UINT64, AVERAGE),699COUNTABLE(AXI_WRITE_DATA_BEATS_ID_6, UINT64, AVERAGE),700COUNTABLE(AXI_WRITE_DATA_BEATS_ID_7, UINT64, AVERAGE),701COUNTABLE(AXI_WRITE_DATA_BEATS_ID_8, UINT64, AVERAGE),702COUNTABLE(AXI_WRITE_DATA_BEATS_ID_9, UINT64, AVERAGE),703COUNTABLE(AXI_WRITE_DATA_BEATS_ID_10, UINT64, AVERAGE),704COUNTABLE(AXI_WRITE_DATA_BEATS_ID_11, UINT64, AVERAGE),705COUNTABLE(AXI_WRITE_DATA_BEATS_ID_12, UINT64, AVERAGE),706COUNTABLE(AXI_WRITE_DATA_BEATS_ID_13, UINT64, AVERAGE),707COUNTABLE(AXI_WRITE_DATA_BEATS_ID_14, UINT64, AVERAGE),708COUNTABLE(AXI_WRITE_DATA_BEATS_ID_15, UINT64, AVERAGE),709COUNTABLE(AXI0_WRITE_DATA_BEATS_TOTAL, UINT64, AVERAGE),710COUNTABLE(AXI1_WRITE_DATA_BEATS_TOTAL, UINT64, AVERAGE),711COUNTABLE(AXI2_WRITE_DATA_BEATS_TOTAL, UINT64, AVERAGE),712COUNTABLE(AXI3_WRITE_DATA_BEATS_TOTAL, UINT64, AVERAGE),713COUNTABLE(AXI_WRITE_DATA_BEATS_TOTAL, UINT64, AVERAGE),714COUNTABLE(AXI_DATA_BEATS_TOTAL, UINT64, AVERAGE),715};716#endif717718const struct fd_perfcntr_group a5xx_perfcntr_groups[] = {719GROUP("CP", cp_counters, cp_countables),720GROUP("CCU", ccu_counters, ccu_countables),721GROUP("TSE", tse_counters, tse_countables),722GROUP("RAS", ras_counters, ras_countables),723GROUP("LRZ", lrz_counters, lrz_countables),724GROUP("HLSQ", hlsq_counters, hlsq_countables),725GROUP("PC", pc_counters, pc_countables),726GROUP("RB", rb_counters, rb_countables),727GROUP("RBBM", rbbm_counters, rbbm_countables),728GROUP("SP", sp_counters, sp_countables),729GROUP("TP", tp_counters, tp_countables),730GROUP("UCHE", uche_counters, uche_countables),731GROUP("VFD", vfd_counters, vfd_countables),732GROUP("VPC", vpc_counters, vpc_countables),733GROUP("VSC", vsc_counters, vsc_countables),734// GROUP("VBIF", vbif_counters, vbif_countables),735};736737const unsigned a5xx_num_perfcntr_groups = ARRAY_SIZE(a5xx_perfcntr_groups);738739#endif /* FD5_PERFCNTR_H_ */740741742