freedreno: update generated headers
[mesa.git] / src / gallium / drivers / freedreno / a4xx / a4xx.xml.h
index 4436697aad4ba14d1cbe0d47dcf1258367f6ab2c..2dfdc281957cf2ac449949d3d6bb7deb7479c902 100644 (file)
@@ -8,17 +8,19 @@ http://github.com/freedreno/envytools/
 git clone https://github.com/freedreno/envytools.git
 
 The rules-ng-ng source files this header was generated from are:
-- /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    398 bytes, from 2015-09-24 17:25:31)
-- /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1453 bytes, from 2015-05-20 20:03:07)
-- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32901 bytes, from 2015-05-20 20:03:14)
-- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (  10755 bytes, from 2015-09-14 20:46:55)
-- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  14968 bytes, from 2015-05-20 20:12:27)
-- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  68291 bytes, from 2015-11-17 16:39:59)
-- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (  64038 bytes, from 2015-11-17 16:37:36)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    431 bytes, from 2016-04-26 17:56:44)
+- /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1572 bytes, from 2016-02-10 17:07:21)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32907 bytes, from 2016-11-26 23:01:08)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (  12025 bytes, from 2016-11-26 23:01:08)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  23277 bytes, from 2016-12-24 05:01:47)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  83840 bytes, from 2016-11-26 23:01:08)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          ( 110757 bytes, from 2016-12-26 17:51:07)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a5xx.xml          (  99436 bytes, from 2017-01-10 16:36:25)
 - /home/robclark/src/freedreno/envytools/rnndb/adreno/ocmem.xml         (   1773 bytes, from 2015-09-24 17:30:00)
 
-Copyright (C) 2013-2015 by the following authors:
+Copyright (C) 2013-2016 by the following authors:
 - Rob Clark <robdclark@gmail.com> (robclark)
+- Ilia Mirkin <imirkin@alum.mit.edu> (imirkin)
 
 Permission is hereby granted, free of charge, to any person obtaining
 a copy of this software and associated documentation files (the
@@ -45,6 +47,9 @@ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 enum a4xx_color_fmt {
        RB4_A8_UNORM = 1,
        RB4_R8_UNORM = 2,
+       RB4_R8_SNORM = 3,
+       RB4_R8_UINT = 4,
+       RB4_R8_SINT = 5,
        RB4_R4G4B4A4_UNORM = 8,
        RB4_R5G5B5A1_UNORM = 10,
        RB4_R5G6B5_UNORM = 14,
@@ -88,17 +93,10 @@ enum a4xx_color_fmt {
 
 enum a4xx_tile_mode {
        TILE4_LINEAR = 0,
+       TILE4_2 = 2,
        TILE4_3 = 3,
 };
 
-enum a4xx_rb_blend_opcode {
-       BLEND_DST_PLUS_SRC = 0,
-       BLEND_SRC_MINUS_DST = 1,
-       BLEND_DST_MINUS_SRC = 2,
-       BLEND_MIN_DST_SRC = 3,
-       BLEND_MAX_DST_SRC = 4,
-};
-
 enum a4xx_vtx_fmt {
        VFMT4_32_FLOAT = 1,
        VFMT4_32_32_FLOAT = 2,
@@ -112,6 +110,7 @@ enum a4xx_vtx_fmt {
        VFMT4_32_32_FIXED = 10,
        VFMT4_32_32_32_FIXED = 11,
        VFMT4_32_32_32_32_FIXED = 12,
+       VFMT4_11_11_10_FLOAT = 13,
        VFMT4_16_SINT = 16,
        VFMT4_16_16_SINT = 17,
        VFMT4_16_16_16_SINT = 18,
@@ -152,58 +151,66 @@ enum a4xx_vtx_fmt {
        VFMT4_8_8_SNORM = 53,
        VFMT4_8_8_8_SNORM = 54,
        VFMT4_8_8_8_8_SNORM = 55,
-       VFMT4_10_10_10_2_UINT = 60,
-       VFMT4_10_10_10_2_UNORM = 61,
-       VFMT4_10_10_10_2_SINT = 62,
-       VFMT4_10_10_10_2_SNORM = 63,
+       VFMT4_10_10_10_2_UINT = 56,
+       VFMT4_10_10_10_2_UNORM = 57,
+       VFMT4_10_10_10_2_SINT = 58,
+       VFMT4_10_10_10_2_SNORM = 59,
+       VFMT4_2_10_10_10_UINT = 60,
+       VFMT4_2_10_10_10_UNORM = 61,
+       VFMT4_2_10_10_10_SINT = 62,
+       VFMT4_2_10_10_10_SNORM = 63,
 };
 
 enum a4xx_tex_fmt {
-       TFMT4_5_6_5_UNORM = 11,
-       TFMT4_5_5_5_1_UNORM = 9,
-       TFMT4_4_4_4_4_UNORM = 8,
-       TFMT4_X8Z24_UNORM = 71,
-       TFMT4_10_10_10_2_UNORM = 33,
        TFMT4_A8_UNORM = 3,
-       TFMT4_L8_A8_UNORM = 13,
        TFMT4_8_UNORM = 4,
-       TFMT4_8_8_UNORM = 14,
-       TFMT4_8_8_8_8_UNORM = 28,
        TFMT4_8_SNORM = 5,
-       TFMT4_8_8_SNORM = 15,
-       TFMT4_8_8_8_8_SNORM = 29,
        TFMT4_8_UINT = 6,
-       TFMT4_8_8_UINT = 16,
-       TFMT4_8_8_8_8_UINT = 30,
        TFMT4_8_SINT = 7,
+       TFMT4_4_4_4_4_UNORM = 8,
+       TFMT4_5_5_5_1_UNORM = 9,
+       TFMT4_5_6_5_UNORM = 11,
+       TFMT4_L8_A8_UNORM = 13,
+       TFMT4_8_8_UNORM = 14,
+       TFMT4_8_8_SNORM = 15,
+       TFMT4_8_8_UINT = 16,
        TFMT4_8_8_SINT = 17,
-       TFMT4_8_8_8_8_SINT = 31,
        TFMT4_16_UNORM = 18,
-       TFMT4_16_16_UNORM = 38,
-       TFMT4_16_16_16_16_UNORM = 51,
        TFMT4_16_SNORM = 19,
-       TFMT4_16_16_SNORM = 39,
-       TFMT4_16_16_16_16_SNORM = 52,
+       TFMT4_16_FLOAT = 20,
        TFMT4_16_UINT = 21,
-       TFMT4_16_16_UINT = 41,
-       TFMT4_16_16_16_16_UINT = 54,
        TFMT4_16_SINT = 22,
+       TFMT4_8_8_8_8_UNORM = 28,
+       TFMT4_8_8_8_8_SNORM = 29,
+       TFMT4_8_8_8_8_UINT = 30,
+       TFMT4_8_8_8_8_SINT = 31,
+       TFMT4_9_9_9_E5_FLOAT = 32,
+       TFMT4_10_10_10_2_UNORM = 33,
+       TFMT4_10_10_10_2_UINT = 34,
+       TFMT4_11_11_10_FLOAT = 37,
+       TFMT4_16_16_UNORM = 38,
+       TFMT4_16_16_SNORM = 39,
+       TFMT4_16_16_FLOAT = 40,
+       TFMT4_16_16_UINT = 41,
        TFMT4_16_16_SINT = 42,
-       TFMT4_16_16_16_16_SINT = 55,
+       TFMT4_32_FLOAT = 43,
        TFMT4_32_UINT = 44,
-       TFMT4_32_32_UINT = 57,
-       TFMT4_32_32_32_32_UINT = 64,
        TFMT4_32_SINT = 45,
-       TFMT4_32_32_SINT = 58,
-       TFMT4_32_32_32_32_SINT = 65,
-       TFMT4_16_FLOAT = 20,
-       TFMT4_16_16_FLOAT = 40,
+       TFMT4_16_16_16_16_UNORM = 51,
+       TFMT4_16_16_16_16_SNORM = 52,
        TFMT4_16_16_16_16_FLOAT = 53,
-       TFMT4_32_FLOAT = 43,
+       TFMT4_16_16_16_16_UINT = 54,
+       TFMT4_16_16_16_16_SINT = 55,
        TFMT4_32_32_FLOAT = 56,
+       TFMT4_32_32_UINT = 57,
+       TFMT4_32_32_SINT = 58,
+       TFMT4_32_32_32_FLOAT = 59,
+       TFMT4_32_32_32_UINT = 60,
+       TFMT4_32_32_32_SINT = 61,
        TFMT4_32_32_32_32_FLOAT = 63,
-       TFMT4_9_9_9_E5_FLOAT = 32,
-       TFMT4_11_11_10_FLOAT = 37,
+       TFMT4_32_32_32_32_UINT = 64,
+       TFMT4_32_32_32_32_SINT = 65,
+       TFMT4_X8Z24_UNORM = 71,
        TFMT4_DXT1 = 86,
        TFMT4_DXT3 = 87,
        TFMT4_DXT5 = 88,
@@ -262,6 +269,545 @@ enum a4xx_tess_spacing {
        EVEN_SPACING = 3,
 };
 
+enum a4xx_ccu_perfcounter_select {
+       CCU_BUSY_CYCLES = 0,
+       CCU_RB_DEPTH_RETURN_STALL = 2,
+       CCU_RB_COLOR_RETURN_STALL = 3,
+       CCU_DEPTH_BLOCKS = 6,
+       CCU_COLOR_BLOCKS = 7,
+       CCU_DEPTH_BLOCK_HIT = 8,
+       CCU_COLOR_BLOCK_HIT = 9,
+       CCU_DEPTH_FLAG1_COUNT = 10,
+       CCU_DEPTH_FLAG2_COUNT = 11,
+       CCU_DEPTH_FLAG3_COUNT = 12,
+       CCU_DEPTH_FLAG4_COUNT = 13,
+       CCU_COLOR_FLAG1_COUNT = 14,
+       CCU_COLOR_FLAG2_COUNT = 15,
+       CCU_COLOR_FLAG3_COUNT = 16,
+       CCU_COLOR_FLAG4_COUNT = 17,
+       CCU_PARTIAL_BLOCK_READ = 18,
+};
+
+enum a4xx_cp_perfcounter_select {
+       CP_ALWAYS_COUNT = 0,
+       CP_BUSY = 1,
+       CP_PFP_IDLE = 2,
+       CP_PFP_BUSY_WORKING = 3,
+       CP_PFP_STALL_CYCLES_ANY = 4,
+       CP_PFP_STARVE_CYCLES_ANY = 5,
+       CP_PFP_STARVED_PER_LOAD_ADDR = 6,
+       CP_PFP_STALLED_PER_STORE_ADDR = 7,
+       CP_PFP_PC_PROFILE = 8,
+       CP_PFP_MATCH_PM4_PKT_PROFILE = 9,
+       CP_PFP_COND_INDIRECT_DISCARDED = 10,
+       CP_LONG_RESUMPTIONS = 11,
+       CP_RESUME_CYCLES = 12,
+       CP_RESUME_TO_BOUNDARY_CYCLES = 13,
+       CP_LONG_PREEMPTIONS = 14,
+       CP_PREEMPT_CYCLES = 15,
+       CP_PREEMPT_TO_BOUNDARY_CYCLES = 16,
+       CP_ME_FIFO_EMPTY_PFP_IDLE = 17,
+       CP_ME_FIFO_EMPTY_PFP_BUSY = 18,
+       CP_ME_FIFO_NOT_EMPTY_NOT_FULL = 19,
+       CP_ME_FIFO_FULL_ME_BUSY = 20,
+       CP_ME_FIFO_FULL_ME_NON_WORKING = 21,
+       CP_ME_WAITING_FOR_PACKETS = 22,
+       CP_ME_BUSY_WORKING = 23,
+       CP_ME_STARVE_CYCLES_ANY = 24,
+       CP_ME_STARVE_CYCLES_PER_PROFILE = 25,
+       CP_ME_STALL_CYCLES_PER_PROFILE = 26,
+       CP_ME_PC_PROFILE = 27,
+       CP_RCIU_FIFO_EMPTY = 28,
+       CP_RCIU_FIFO_NOT_EMPTY_NOT_FULL = 29,
+       CP_RCIU_FIFO_FULL = 30,
+       CP_RCIU_FIFO_FULL_NO_CONTEXT = 31,
+       CP_RCIU_FIFO_FULL_AHB_MASTER = 32,
+       CP_RCIU_FIFO_FULL_OTHER = 33,
+       CP_AHB_IDLE = 34,
+       CP_AHB_STALL_ON_GRANT_NO_SPLIT = 35,
+       CP_AHB_STALL_ON_GRANT_SPLIT = 36,
+       CP_AHB_STALL_ON_GRANT_SPLIT_PROFILE = 37,
+       CP_AHB_BUSY_WORKING = 38,
+       CP_AHB_BUSY_STALL_ON_HRDY = 39,
+       CP_AHB_BUSY_STALL_ON_HRDY_PROFILE = 40,
+};
+
+enum a4xx_gras_ras_perfcounter_select {
+       RAS_SUPER_TILES = 0,
+       RAS_8X8_TILES = 1,
+       RAS_4X4_TILES = 2,
+       RAS_BUSY_CYCLES = 3,
+       RAS_STALL_CYCLES_BY_RB = 4,
+       RAS_STALL_CYCLES_BY_VSC = 5,
+       RAS_STARVE_CYCLES_BY_TSE = 6,
+       RAS_SUPERTILE_CYCLES = 7,
+       RAS_TILE_CYCLES = 8,
+       RAS_FULLY_COVERED_SUPER_TILES = 9,
+       RAS_FULLY_COVERED_8X8_TILES = 10,
+       RAS_4X4_PRIM = 11,
+       RAS_8X4_4X8_PRIM = 12,
+       RAS_8X8_PRIM = 13,
+};
+
+enum a4xx_gras_tse_perfcounter_select {
+       TSE_INPUT_PRIM = 0,
+       TSE_INPUT_NULL_PRIM = 1,
+       TSE_TRIVAL_REJ_PRIM = 2,
+       TSE_CLIPPED_PRIM = 3,
+       TSE_NEW_PRIM = 4,
+       TSE_ZERO_AREA_PRIM = 5,
+       TSE_FACENESS_CULLED_PRIM = 6,
+       TSE_ZERO_PIXEL_PRIM = 7,
+       TSE_OUTPUT_NULL_PRIM = 8,
+       TSE_OUTPUT_VISIBLE_PRIM = 9,
+       TSE_PRE_CLIP_PRIM = 10,
+       TSE_POST_CLIP_PRIM = 11,
+       TSE_BUSY_CYCLES = 12,
+       TSE_PC_STARVE = 13,
+       TSE_RAS_STALL = 14,
+       TSE_STALL_BARYPLANE_FIFO_FULL = 15,
+       TSE_STALL_ZPLANE_FIFO_FULL = 16,
+};
+
+enum a4xx_hlsq_perfcounter_select {
+       HLSQ_SP_VS_STAGE_CONSTANT = 0,
+       HLSQ_SP_VS_STAGE_INSTRUCTIONS = 1,
+       HLSQ_SP_FS_STAGE_CONSTANT = 2,
+       HLSQ_SP_FS_STAGE_INSTRUCTIONS = 3,
+       HLSQ_TP_STATE = 4,
+       HLSQ_QUADS = 5,
+       HLSQ_PIXELS = 6,
+       HLSQ_VERTICES = 7,
+       HLSQ_SP_VS_STAGE_DATA_BYTES = 13,
+       HLSQ_SP_FS_STAGE_DATA_BYTES = 14,
+       HLSQ_BUSY_CYCLES = 15,
+       HLSQ_STALL_CYCLES_SP_STATE = 16,
+       HLSQ_STALL_CYCLES_SP_VS_STAGE = 17,
+       HLSQ_STALL_CYCLES_SP_FS_STAGE = 18,
+       HLSQ_STALL_CYCLES_UCHE = 19,
+       HLSQ_RBBM_LOAD_CYCLES = 20,
+       HLSQ_DI_TO_VS_START_SP = 21,
+       HLSQ_DI_TO_FS_START_SP = 22,
+       HLSQ_VS_STAGE_START_TO_DONE_SP = 23,
+       HLSQ_FS_STAGE_START_TO_DONE_SP = 24,
+       HLSQ_SP_STATE_COPY_CYCLES_VS_STAGE = 25,
+       HLSQ_SP_STATE_COPY_CYCLES_FS_STAGE = 26,
+       HLSQ_UCHE_LATENCY_CYCLES = 27,
+       HLSQ_UCHE_LATENCY_COUNT = 28,
+       HLSQ_STARVE_CYCLES_VFD = 29,
+};
+
+enum a4xx_pc_perfcounter_select {
+       PC_VIS_STREAMS_LOADED = 0,
+       PC_VPC_PRIMITIVES = 2,
+       PC_DEAD_PRIM = 3,
+       PC_LIVE_PRIM = 4,
+       PC_DEAD_DRAWCALLS = 5,
+       PC_LIVE_DRAWCALLS = 6,
+       PC_VERTEX_MISSES = 7,
+       PC_STALL_CYCLES_VFD = 9,
+       PC_STALL_CYCLES_TSE = 10,
+       PC_STALL_CYCLES_UCHE = 11,
+       PC_WORKING_CYCLES = 12,
+       PC_IA_VERTICES = 13,
+       PC_GS_PRIMITIVES = 14,
+       PC_HS_INVOCATIONS = 15,
+       PC_DS_INVOCATIONS = 16,
+       PC_DS_PRIMITIVES = 17,
+       PC_STARVE_CYCLES_FOR_INDEX = 20,
+       PC_STARVE_CYCLES_FOR_TESS_FACTOR = 21,
+       PC_STARVE_CYCLES_FOR_VIZ_STREAM = 22,
+       PC_STALL_CYCLES_TESS = 23,
+       PC_STARVE_CYCLES_FOR_POSITION = 24,
+       PC_MODE0_DRAWCALL = 25,
+       PC_MODE1_DRAWCALL = 26,
+       PC_MODE2_DRAWCALL = 27,
+       PC_MODE3_DRAWCALL = 28,
+       PC_MODE4_DRAWCALL = 29,
+       PC_PREDICATED_DEAD_DRAWCALL = 30,
+       PC_STALL_CYCLES_BY_TSE_ONLY = 31,
+       PC_STALL_CYCLES_BY_VPC_ONLY = 32,
+       PC_VPC_POS_DATA_TRANSACTION = 33,
+       PC_BUSY_CYCLES = 34,
+       PC_STARVE_CYCLES_DI = 35,
+       PC_STALL_CYCLES_VPC = 36,
+       TESS_WORKING_CYCLES = 37,
+       TESS_NUM_CYCLES_SETUP_WORKING = 38,
+       TESS_NUM_CYCLES_PTGEN_WORKING = 39,
+       TESS_NUM_CYCLES_CONNGEN_WORKING = 40,
+       TESS_BUSY_CYCLES = 41,
+       TESS_STARVE_CYCLES_PC = 42,
+       TESS_STALL_CYCLES_PC = 43,
+};
+
+enum a4xx_pwr_perfcounter_select {
+       PWR_CORE_CLOCK_CYCLES = 0,
+       PWR_BUSY_CLOCK_CYCLES = 1,
+};
+
+enum a4xx_rb_perfcounter_select {
+       RB_BUSY_CYCLES = 0,
+       RB_BUSY_CYCLES_BINNING = 1,
+       RB_BUSY_CYCLES_RENDERING = 2,
+       RB_BUSY_CYCLES_RESOLVE = 3,
+       RB_STARVE_CYCLES_BY_SP = 4,
+       RB_STARVE_CYCLES_BY_RAS = 5,
+       RB_STARVE_CYCLES_BY_MARB = 6,
+       RB_STALL_CYCLES_BY_MARB = 7,
+       RB_STALL_CYCLES_BY_HLSQ = 8,
+       RB_RB_RB_MARB_DATA = 9,
+       RB_SP_RB_QUAD = 10,
+       RB_RAS_RB_Z_QUADS = 11,
+       RB_GMEM_CH0_READ = 12,
+       RB_GMEM_CH1_READ = 13,
+       RB_GMEM_CH0_WRITE = 14,
+       RB_GMEM_CH1_WRITE = 15,
+       RB_CP_CONTEXT_DONE = 16,
+       RB_CP_CACHE_FLUSH = 17,
+       RB_CP_ZPASS_DONE = 18,
+       RB_STALL_FIFO0_FULL = 19,
+       RB_STALL_FIFO1_FULL = 20,
+       RB_STALL_FIFO2_FULL = 21,
+       RB_STALL_FIFO3_FULL = 22,
+       RB_RB_HLSQ_TRANSACTIONS = 23,
+       RB_Z_READ = 24,
+       RB_Z_WRITE = 25,
+       RB_C_READ = 26,
+       RB_C_WRITE = 27,
+       RB_C_READ_LATENCY = 28,
+       RB_Z_READ_LATENCY = 29,
+       RB_STALL_BY_UCHE = 30,
+       RB_MARB_UCHE_TRANSACTIONS = 31,
+       RB_CACHE_STALL_MISS = 32,
+       RB_CACHE_STALL_FIFO_FULL = 33,
+       RB_8BIT_BLENDER_UNITS_ACTIVE = 34,
+       RB_16BIT_BLENDER_UNITS_ACTIVE = 35,
+       RB_SAMPLER_UNITS_ACTIVE = 36,
+       RB_TOTAL_PASS = 38,
+       RB_Z_PASS = 39,
+       RB_Z_FAIL = 40,
+       RB_S_FAIL = 41,
+       RB_POWER0 = 42,
+       RB_POWER1 = 43,
+       RB_POWER2 = 44,
+       RB_POWER3 = 45,
+       RB_POWER4 = 46,
+       RB_POWER5 = 47,
+       RB_POWER6 = 48,
+       RB_POWER7 = 49,
+};
+
+enum a4xx_rbbm_perfcounter_select {
+       RBBM_ALWAYS_ON = 0,
+       RBBM_VBIF_BUSY = 1,
+       RBBM_TSE_BUSY = 2,
+       RBBM_RAS_BUSY = 3,
+       RBBM_PC_DCALL_BUSY = 4,
+       RBBM_PC_VSD_BUSY = 5,
+       RBBM_VFD_BUSY = 6,
+       RBBM_VPC_BUSY = 7,
+       RBBM_UCHE_BUSY = 8,
+       RBBM_VSC_BUSY = 9,
+       RBBM_HLSQ_BUSY = 10,
+       RBBM_ANY_RB_BUSY = 11,
+       RBBM_ANY_TPL1_BUSY = 12,
+       RBBM_ANY_SP_BUSY = 13,
+       RBBM_ANY_MARB_BUSY = 14,
+       RBBM_ANY_ARB_BUSY = 15,
+       RBBM_AHB_STATUS_BUSY = 16,
+       RBBM_AHB_STATUS_STALLED = 17,
+       RBBM_AHB_STATUS_TXFR = 18,
+       RBBM_AHB_STATUS_TXFR_SPLIT = 19,
+       RBBM_AHB_STATUS_TXFR_ERROR = 20,
+       RBBM_AHB_STATUS_LONG_STALL = 21,
+       RBBM_STATUS_MASKED = 22,
+       RBBM_CP_BUSY_GFX_CORE_IDLE = 23,
+       RBBM_TESS_BUSY = 24,
+       RBBM_COM_BUSY = 25,
+       RBBM_DCOM_BUSY = 32,
+       RBBM_ANY_CCU_BUSY = 33,
+       RBBM_DPM_BUSY = 34,
+};
+
+enum a4xx_sp_perfcounter_select {
+       SP_LM_LOAD_INSTRUCTIONS = 0,
+       SP_LM_STORE_INSTRUCTIONS = 1,
+       SP_LM_ATOMICS = 2,
+       SP_GM_LOAD_INSTRUCTIONS = 3,
+       SP_GM_STORE_INSTRUCTIONS = 4,
+       SP_GM_ATOMICS = 5,
+       SP_VS_STAGE_TEX_INSTRUCTIONS = 6,
+       SP_VS_STAGE_CFLOW_INSTRUCTIONS = 7,
+       SP_VS_STAGE_EFU_INSTRUCTIONS = 8,
+       SP_VS_STAGE_FULL_ALU_INSTRUCTIONS = 9,
+       SP_VS_STAGE_HALF_ALU_INSTRUCTIONS = 10,
+       SP_FS_STAGE_TEX_INSTRUCTIONS = 11,
+       SP_FS_STAGE_CFLOW_INSTRUCTIONS = 12,
+       SP_FS_STAGE_EFU_INSTRUCTIONS = 13,
+       SP_FS_STAGE_FULL_ALU_INSTRUCTIONS = 14,
+       SP_FS_STAGE_HALF_ALU_INSTRUCTIONS = 15,
+       SP_VS_INSTRUCTIONS = 17,
+       SP_FS_INSTRUCTIONS = 18,
+       SP_ADDR_LOCK_COUNT = 19,
+       SP_UCHE_READ_TRANS = 20,
+       SP_UCHE_WRITE_TRANS = 21,
+       SP_EXPORT_VPC_TRANS = 22,
+       SP_EXPORT_RB_TRANS = 23,
+       SP_PIXELS_KILLED = 24,
+       SP_ICL1_REQUESTS = 25,
+       SP_ICL1_MISSES = 26,
+       SP_ICL0_REQUESTS = 27,
+       SP_ICL0_MISSES = 28,
+       SP_ALU_WORKING_CYCLES = 29,
+       SP_EFU_WORKING_CYCLES = 30,
+       SP_STALL_CYCLES_BY_VPC = 31,
+       SP_STALL_CYCLES_BY_TP = 32,
+       SP_STALL_CYCLES_BY_UCHE = 33,
+       SP_STALL_CYCLES_BY_RB = 34,
+       SP_BUSY_CYCLES = 35,
+       SP_HS_INSTRUCTIONS = 36,
+       SP_DS_INSTRUCTIONS = 37,
+       SP_GS_INSTRUCTIONS = 38,
+       SP_CS_INSTRUCTIONS = 39,
+       SP_SCHEDULER_NON_WORKING = 40,
+       SP_WAVE_CONTEXTS = 41,
+       SP_WAVE_CONTEXT_CYCLES = 42,
+       SP_POWER0 = 43,
+       SP_POWER1 = 44,
+       SP_POWER2 = 45,
+       SP_POWER3 = 46,
+       SP_POWER4 = 47,
+       SP_POWER5 = 48,
+       SP_POWER6 = 49,
+       SP_POWER7 = 50,
+       SP_POWER8 = 51,
+       SP_POWER9 = 52,
+       SP_POWER10 = 53,
+       SP_POWER11 = 54,
+       SP_POWER12 = 55,
+       SP_POWER13 = 56,
+       SP_POWER14 = 57,
+       SP_POWER15 = 58,
+};
+
+enum a4xx_tp_perfcounter_select {
+       TP_L1_REQUESTS = 0,
+       TP_L1_MISSES = 1,
+       TP_QUADS_OFFSET = 8,
+       TP_QUAD_SHADOW = 9,
+       TP_QUADS_ARRAY = 10,
+       TP_QUADS_GRADIENT = 11,
+       TP_QUADS_1D2D = 12,
+       TP_QUADS_3DCUBE = 13,
+       TP_BUSY_CYCLES = 16,
+       TP_STALL_CYCLES_BY_ARB = 17,
+       TP_STATE_CACHE_REQUESTS = 20,
+       TP_STATE_CACHE_MISSES = 21,
+       TP_POWER0 = 22,
+       TP_POWER1 = 23,
+       TP_POWER2 = 24,
+       TP_POWER3 = 25,
+       TP_POWER4 = 26,
+       TP_POWER5 = 27,
+       TP_POWER6 = 28,
+       TP_POWER7 = 29,
+};
+
+enum a4xx_uche_perfcounter_select {
+       UCHE_VBIF_READ_BEATS_TP = 0,
+       UCHE_VBIF_READ_BEATS_VFD = 1,
+       UCHE_VBIF_READ_BEATS_HLSQ = 2,
+       UCHE_VBIF_READ_BEATS_MARB = 3,
+       UCHE_VBIF_READ_BEATS_SP = 4,
+       UCHE_READ_REQUESTS_TP = 5,
+       UCHE_READ_REQUESTS_VFD = 6,
+       UCHE_READ_REQUESTS_HLSQ = 7,
+       UCHE_READ_REQUESTS_MARB = 8,
+       UCHE_READ_REQUESTS_SP = 9,
+       UCHE_WRITE_REQUESTS_MARB = 10,
+       UCHE_WRITE_REQUESTS_SP = 11,
+       UCHE_TAG_CHECK_FAILS = 12,
+       UCHE_EVICTS = 13,
+       UCHE_FLUSHES = 14,
+       UCHE_VBIF_LATENCY_CYCLES = 15,
+       UCHE_VBIF_LATENCY_SAMPLES = 16,
+       UCHE_BUSY_CYCLES = 17,
+       UCHE_VBIF_READ_BEATS_PC = 18,
+       UCHE_READ_REQUESTS_PC = 19,
+       UCHE_WRITE_REQUESTS_VPC = 20,
+       UCHE_STALL_BY_VBIF = 21,
+       UCHE_WRITE_REQUESTS_VSC = 22,
+       UCHE_POWER0 = 23,
+       UCHE_POWER1 = 24,
+       UCHE_POWER2 = 25,
+       UCHE_POWER3 = 26,
+       UCHE_POWER4 = 27,
+       UCHE_POWER5 = 28,
+       UCHE_POWER6 = 29,
+       UCHE_POWER7 = 30,
+};
+
+enum a4xx_vbif_perfcounter_select {
+       AXI_READ_REQUESTS_ID_0 = 0,
+       AXI_READ_REQUESTS_ID_1 = 1,
+       AXI_READ_REQUESTS_ID_2 = 2,
+       AXI_READ_REQUESTS_ID_3 = 3,
+       AXI_READ_REQUESTS_ID_4 = 4,
+       AXI_READ_REQUESTS_ID_5 = 5,
+       AXI_READ_REQUESTS_ID_6 = 6,
+       AXI_READ_REQUESTS_ID_7 = 7,
+       AXI_READ_REQUESTS_ID_8 = 8,
+       AXI_READ_REQUESTS_ID_9 = 9,
+       AXI_READ_REQUESTS_ID_10 = 10,
+       AXI_READ_REQUESTS_ID_11 = 11,
+       AXI_READ_REQUESTS_ID_12 = 12,
+       AXI_READ_REQUESTS_ID_13 = 13,
+       AXI_READ_REQUESTS_ID_14 = 14,
+       AXI_READ_REQUESTS_ID_15 = 15,
+       AXI0_READ_REQUESTS_TOTAL = 16,
+       AXI1_READ_REQUESTS_TOTAL = 17,
+       AXI2_READ_REQUESTS_TOTAL = 18,
+       AXI3_READ_REQUESTS_TOTAL = 19,
+       AXI_READ_REQUESTS_TOTAL = 20,
+       AXI_WRITE_REQUESTS_ID_0 = 21,
+       AXI_WRITE_REQUESTS_ID_1 = 22,
+       AXI_WRITE_REQUESTS_ID_2 = 23,
+       AXI_WRITE_REQUESTS_ID_3 = 24,
+       AXI_WRITE_REQUESTS_ID_4 = 25,
+       AXI_WRITE_REQUESTS_ID_5 = 26,
+       AXI_WRITE_REQUESTS_ID_6 = 27,
+       AXI_WRITE_REQUESTS_ID_7 = 28,
+       AXI_WRITE_REQUESTS_ID_8 = 29,
+       AXI_WRITE_REQUESTS_ID_9 = 30,
+       AXI_WRITE_REQUESTS_ID_10 = 31,
+       AXI_WRITE_REQUESTS_ID_11 = 32,
+       AXI_WRITE_REQUESTS_ID_12 = 33,
+       AXI_WRITE_REQUESTS_ID_13 = 34,
+       AXI_WRITE_REQUESTS_ID_14 = 35,
+       AXI_WRITE_REQUESTS_ID_15 = 36,
+       AXI0_WRITE_REQUESTS_TOTAL = 37,
+       AXI1_WRITE_REQUESTS_TOTAL = 38,
+       AXI2_WRITE_REQUESTS_TOTAL = 39,
+       AXI3_WRITE_REQUESTS_TOTAL = 40,
+       AXI_WRITE_REQUESTS_TOTAL = 41,
+       AXI_TOTAL_REQUESTS = 42,
+       AXI_READ_DATA_BEATS_ID_0 = 43,
+       AXI_READ_DATA_BEATS_ID_1 = 44,
+       AXI_READ_DATA_BEATS_ID_2 = 45,
+       AXI_READ_DATA_BEATS_ID_3 = 46,
+       AXI_READ_DATA_BEATS_ID_4 = 47,
+       AXI_READ_DATA_BEATS_ID_5 = 48,
+       AXI_READ_DATA_BEATS_ID_6 = 49,
+       AXI_READ_DATA_BEATS_ID_7 = 50,
+       AXI_READ_DATA_BEATS_ID_8 = 51,
+       AXI_READ_DATA_BEATS_ID_9 = 52,
+       AXI_READ_DATA_BEATS_ID_10 = 53,
+       AXI_READ_DATA_BEATS_ID_11 = 54,
+       AXI_READ_DATA_BEATS_ID_12 = 55,
+       AXI_READ_DATA_BEATS_ID_13 = 56,
+       AXI_READ_DATA_BEATS_ID_14 = 57,
+       AXI_READ_DATA_BEATS_ID_15 = 58,
+       AXI0_READ_DATA_BEATS_TOTAL = 59,
+       AXI1_READ_DATA_BEATS_TOTAL = 60,
+       AXI2_READ_DATA_BEATS_TOTAL = 61,
+       AXI3_READ_DATA_BEATS_TOTAL = 62,
+       AXI_READ_DATA_BEATS_TOTAL = 63,
+       AXI_WRITE_DATA_BEATS_ID_0 = 64,
+       AXI_WRITE_DATA_BEATS_ID_1 = 65,
+       AXI_WRITE_DATA_BEATS_ID_2 = 66,
+       AXI_WRITE_DATA_BEATS_ID_3 = 67,
+       AXI_WRITE_DATA_BEATS_ID_4 = 68,
+       AXI_WRITE_DATA_BEATS_ID_5 = 69,
+       AXI_WRITE_DATA_BEATS_ID_6 = 70,
+       AXI_WRITE_DATA_BEATS_ID_7 = 71,
+       AXI_WRITE_DATA_BEATS_ID_8 = 72,
+       AXI_WRITE_DATA_BEATS_ID_9 = 73,
+       AXI_WRITE_DATA_BEATS_ID_10 = 74,
+       AXI_WRITE_DATA_BEATS_ID_11 = 75,
+       AXI_WRITE_DATA_BEATS_ID_12 = 76,
+       AXI_WRITE_DATA_BEATS_ID_13 = 77,
+       AXI_WRITE_DATA_BEATS_ID_14 = 78,
+       AXI_WRITE_DATA_BEATS_ID_15 = 79,
+       AXI0_WRITE_DATA_BEATS_TOTAL = 80,
+       AXI1_WRITE_DATA_BEATS_TOTAL = 81,
+       AXI2_WRITE_DATA_BEATS_TOTAL = 82,
+       AXI3_WRITE_DATA_BEATS_TOTAL = 83,
+       AXI_WRITE_DATA_BEATS_TOTAL = 84,
+       AXI_DATA_BEATS_TOTAL = 85,
+       CYCLES_HELD_OFF_ID_0 = 86,
+       CYCLES_HELD_OFF_ID_1 = 87,
+       CYCLES_HELD_OFF_ID_2 = 88,
+       CYCLES_HELD_OFF_ID_3 = 89,
+       CYCLES_HELD_OFF_ID_4 = 90,
+       CYCLES_HELD_OFF_ID_5 = 91,
+       CYCLES_HELD_OFF_ID_6 = 92,
+       CYCLES_HELD_OFF_ID_7 = 93,
+       CYCLES_HELD_OFF_ID_8 = 94,
+       CYCLES_HELD_OFF_ID_9 = 95,
+       CYCLES_HELD_OFF_ID_10 = 96,
+       CYCLES_HELD_OFF_ID_11 = 97,
+       CYCLES_HELD_OFF_ID_12 = 98,
+       CYCLES_HELD_OFF_ID_13 = 99,
+       CYCLES_HELD_OFF_ID_14 = 100,
+       CYCLES_HELD_OFF_ID_15 = 101,
+       AXI_READ_REQUEST_HELD_OFF = 102,
+       AXI_WRITE_REQUEST_HELD_OFF = 103,
+       AXI_REQUEST_HELD_OFF = 104,
+       AXI_WRITE_DATA_HELD_OFF = 105,
+       OCMEM_AXI_READ_REQUEST_HELD_OFF = 106,
+       OCMEM_AXI_WRITE_REQUEST_HELD_OFF = 107,
+       OCMEM_AXI_REQUEST_HELD_OFF = 108,
+       OCMEM_AXI_WRITE_DATA_HELD_OFF = 109,
+       ELAPSED_CYCLES_DDR = 110,
+       ELAPSED_CYCLES_OCMEM = 111,
+};
+
+enum a4xx_vfd_perfcounter_select {
+       VFD_UCHE_BYTE_FETCHED = 0,
+       VFD_UCHE_TRANS = 1,
+       VFD_FETCH_INSTRUCTIONS = 3,
+       VFD_BUSY_CYCLES = 5,
+       VFD_STALL_CYCLES_UCHE = 6,
+       VFD_STALL_CYCLES_HLSQ = 7,
+       VFD_STALL_CYCLES_VPC_BYPASS = 8,
+       VFD_STALL_CYCLES_VPC_ALLOC = 9,
+       VFD_MODE_0_FIBERS = 13,
+       VFD_MODE_1_FIBERS = 14,
+       VFD_MODE_2_FIBERS = 15,
+       VFD_MODE_3_FIBERS = 16,
+       VFD_MODE_4_FIBERS = 17,
+       VFD_BFIFO_STALL = 18,
+       VFD_NUM_VERTICES_TOTAL = 19,
+       VFD_PACKER_FULL = 20,
+       VFD_UCHE_REQUEST_FIFO_FULL = 21,
+       VFD_STARVE_CYCLES_PC = 22,
+       VFD_STARVE_CYCLES_UCHE = 23,
+};
+
+enum a4xx_vpc_perfcounter_select {
+       VPC_SP_LM_COMPONENTS = 2,
+       VPC_SP0_LM_BYTES = 3,
+       VPC_SP1_LM_BYTES = 4,
+       VPC_SP2_LM_BYTES = 5,
+       VPC_SP3_LM_BYTES = 6,
+       VPC_WORKING_CYCLES = 7,
+       VPC_STALL_CYCLES_LM = 8,
+       VPC_STARVE_CYCLES_RAS = 9,
+       VPC_STREAMOUT_CYCLES = 10,
+       VPC_UCHE_TRANSACTIONS = 12,
+       VPC_STALL_CYCLES_UCHE = 13,
+       VPC_BUSY_CYCLES = 14,
+       VPC_STARVE_CYCLES_SP = 15,
+};
+
+enum a4xx_vsc_perfcounter_select {
+       VSC_BUSY_CYCLES = 0,
+       VSC_WORKING_CYCLES = 1,
+       VSC_STALL_CYCLES_UCHE = 2,
+       VSC_STARVE_CYCLES_RAS = 3,
+       VSC_EOT_NUM = 4,
+};
+
 enum a4xx_tex_filter {
        A4XX_TEX_NEAREST = 0,
        A4XX_TEX_LINEAR = 1,
@@ -348,6 +894,12 @@ static inline uint32_t A4XX_CGC_HLSQ_EARLY_CYC(uint32_t val)
 
 #define REG_A4XX_RB_PERFCTR_RB_SEL_7                           0x00000cce
 
+#define REG_A4XX_RB_PERFCTR_CCU_SEL_0                          0x00000ccf
+
+#define REG_A4XX_RB_PERFCTR_CCU_SEL_1                          0x00000cd0
+
+#define REG_A4XX_RB_PERFCTR_CCU_SEL_2                          0x00000cd1
+
 #define REG_A4XX_RB_PERFCTR_CCU_SEL_3                          0x00000cd2
 
 #define REG_A4XX_RB_FRAME_BUFFER_DIMENSION                     0x00000ce0
@@ -377,14 +929,17 @@ static inline uint32_t A4XX_RB_FRAME_BUFFER_DIMENSION_HEIGHT(uint32_t val)
 #define A4XX_RB_MODE_CONTROL_WIDTH__SHIFT                      0
 static inline uint32_t A4XX_RB_MODE_CONTROL_WIDTH(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_MODE_CONTROL_WIDTH__SHIFT) & A4XX_RB_MODE_CONTROL_WIDTH__MASK;
 }
 #define A4XX_RB_MODE_CONTROL_HEIGHT__MASK                      0x00003f00
 #define A4XX_RB_MODE_CONTROL_HEIGHT__SHIFT                     8
 static inline uint32_t A4XX_RB_MODE_CONTROL_HEIGHT(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_MODE_CONTROL_HEIGHT__SHIFT) & A4XX_RB_MODE_CONTROL_HEIGHT__MASK;
 }
+#define A4XX_RB_MODE_CONTROL_ENABLE_GMEM                       0x00010000
 
 #define REG_A4XX_RB_RENDER_CONTROL                             0x000020a1
 #define A4XX_RB_RENDER_CONTROL_BINNING_PASS                    0x00000001
@@ -466,6 +1021,7 @@ static inline uint32_t A4XX_RB_MRT_BUF_INFO_COLOR_SWAP(enum a3xx_color_swap val)
 #define A4XX_RB_MRT_BUF_INFO_COLOR_BUF_PITCH__SHIFT            14
 static inline uint32_t A4XX_RB_MRT_BUF_INFO_COLOR_BUF_PITCH(uint32_t val)
 {
+       assert(!(val & 0xf));
        return ((val >> 4) << A4XX_RB_MRT_BUF_INFO_COLOR_BUF_PITCH__SHIFT) & A4XX_RB_MRT_BUF_INFO_COLOR_BUF_PITCH__MASK;
 }
 
@@ -488,7 +1044,7 @@ static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_RGB_SRC_FACTOR(enum adreno_rb_b
 }
 #define A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__MASK       0x000000e0
 #define A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__SHIFT      5
-static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(enum a4xx_rb_blend_opcode val)
+static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(enum a3xx_rb_blend_opcode val)
 {
        return ((val) << A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__SHIFT) & A4XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__MASK;
 }
@@ -506,7 +1062,7 @@ static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_ALPHA_SRC_FACTOR(enum adreno_rb
 }
 #define A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__MASK     0x00e00000
 #define A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__SHIFT    21
-static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(enum a4xx_rb_blend_opcode val)
+static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(enum a3xx_rb_blend_opcode val)
 {
        return ((val) << A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__SHIFT) & A4XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__MASK;
 }
@@ -518,12 +1074,18 @@ static inline uint32_t A4XX_RB_MRT_BLEND_CONTROL_ALPHA_DEST_FACTOR(enum adreno_r
 }
 
 #define REG_A4XX_RB_BLEND_RED                                  0x000020f0
-#define A4XX_RB_BLEND_RED_UINT__MASK                           0x0000ffff
+#define A4XX_RB_BLEND_RED_UINT__MASK                           0x000000ff
 #define A4XX_RB_BLEND_RED_UINT__SHIFT                          0
 static inline uint32_t A4XX_RB_BLEND_RED_UINT(uint32_t val)
 {
        return ((val) << A4XX_RB_BLEND_RED_UINT__SHIFT) & A4XX_RB_BLEND_RED_UINT__MASK;
 }
+#define A4XX_RB_BLEND_RED_SINT__MASK                           0x0000ff00
+#define A4XX_RB_BLEND_RED_SINT__SHIFT                          8
+static inline uint32_t A4XX_RB_BLEND_RED_SINT(uint32_t val)
+{
+       return ((val) << A4XX_RB_BLEND_RED_SINT__SHIFT) & A4XX_RB_BLEND_RED_SINT__MASK;
+}
 #define A4XX_RB_BLEND_RED_FLOAT__MASK                          0xffff0000
 #define A4XX_RB_BLEND_RED_FLOAT__SHIFT                         16
 static inline uint32_t A4XX_RB_BLEND_RED_FLOAT(float val)
@@ -540,12 +1102,18 @@ static inline uint32_t A4XX_RB_BLEND_RED_F32(float val)
 }
 
 #define REG_A4XX_RB_BLEND_GREEN                                        0x000020f2
-#define A4XX_RB_BLEND_GREEN_UINT__MASK                         0x0000ffff
+#define A4XX_RB_BLEND_GREEN_UINT__MASK                         0x000000ff
 #define A4XX_RB_BLEND_GREEN_UINT__SHIFT                                0
 static inline uint32_t A4XX_RB_BLEND_GREEN_UINT(uint32_t val)
 {
        return ((val) << A4XX_RB_BLEND_GREEN_UINT__SHIFT) & A4XX_RB_BLEND_GREEN_UINT__MASK;
 }
+#define A4XX_RB_BLEND_GREEN_SINT__MASK                         0x0000ff00
+#define A4XX_RB_BLEND_GREEN_SINT__SHIFT                                8
+static inline uint32_t A4XX_RB_BLEND_GREEN_SINT(uint32_t val)
+{
+       return ((val) << A4XX_RB_BLEND_GREEN_SINT__SHIFT) & A4XX_RB_BLEND_GREEN_SINT__MASK;
+}
 #define A4XX_RB_BLEND_GREEN_FLOAT__MASK                                0xffff0000
 #define A4XX_RB_BLEND_GREEN_FLOAT__SHIFT                       16
 static inline uint32_t A4XX_RB_BLEND_GREEN_FLOAT(float val)
@@ -562,12 +1130,18 @@ static inline uint32_t A4XX_RB_BLEND_GREEN_F32(float val)
 }
 
 #define REG_A4XX_RB_BLEND_BLUE                                 0x000020f4
-#define A4XX_RB_BLEND_BLUE_UINT__MASK                          0x0000ffff
+#define A4XX_RB_BLEND_BLUE_UINT__MASK                          0x000000ff
 #define A4XX_RB_BLEND_BLUE_UINT__SHIFT                         0
 static inline uint32_t A4XX_RB_BLEND_BLUE_UINT(uint32_t val)
 {
        return ((val) << A4XX_RB_BLEND_BLUE_UINT__SHIFT) & A4XX_RB_BLEND_BLUE_UINT__MASK;
 }
+#define A4XX_RB_BLEND_BLUE_SINT__MASK                          0x0000ff00
+#define A4XX_RB_BLEND_BLUE_SINT__SHIFT                         8
+static inline uint32_t A4XX_RB_BLEND_BLUE_SINT(uint32_t val)
+{
+       return ((val) << A4XX_RB_BLEND_BLUE_SINT__SHIFT) & A4XX_RB_BLEND_BLUE_SINT__MASK;
+}
 #define A4XX_RB_BLEND_BLUE_FLOAT__MASK                         0xffff0000
 #define A4XX_RB_BLEND_BLUE_FLOAT__SHIFT                                16
 static inline uint32_t A4XX_RB_BLEND_BLUE_FLOAT(float val)
@@ -584,12 +1158,18 @@ static inline uint32_t A4XX_RB_BLEND_BLUE_F32(float val)
 }
 
 #define REG_A4XX_RB_BLEND_ALPHA                                        0x000020f6
-#define A4XX_RB_BLEND_ALPHA_UINT__MASK                         0x0000ffff
+#define A4XX_RB_BLEND_ALPHA_UINT__MASK                         0x000000ff
 #define A4XX_RB_BLEND_ALPHA_UINT__SHIFT                                0
 static inline uint32_t A4XX_RB_BLEND_ALPHA_UINT(uint32_t val)
 {
        return ((val) << A4XX_RB_BLEND_ALPHA_UINT__SHIFT) & A4XX_RB_BLEND_ALPHA_UINT__MASK;
 }
+#define A4XX_RB_BLEND_ALPHA_SINT__MASK                         0x0000ff00
+#define A4XX_RB_BLEND_ALPHA_SINT__SHIFT                                8
+static inline uint32_t A4XX_RB_BLEND_ALPHA_SINT(uint32_t val)
+{
+       return ((val) << A4XX_RB_BLEND_ALPHA_SINT__SHIFT) & A4XX_RB_BLEND_ALPHA_SINT__MASK;
+}
 #define A4XX_RB_BLEND_ALPHA_FLOAT__MASK                                0xffff0000
 #define A4XX_RB_BLEND_ALPHA_FLOAT__SHIFT                       16
 static inline uint32_t A4XX_RB_BLEND_ALPHA_FLOAT(float val)
@@ -627,7 +1207,7 @@ static inline uint32_t A4XX_RB_FS_OUTPUT_ENABLE_BLEND(uint32_t val)
 {
        return ((val) << A4XX_RB_FS_OUTPUT_ENABLE_BLEND__SHIFT) & A4XX_RB_FS_OUTPUT_ENABLE_BLEND__MASK;
 }
-#define A4XX_RB_FS_OUTPUT_FAST_CLEAR                           0x00000100
+#define A4XX_RB_FS_OUTPUT_INDEPENDENT_BLEND                    0x00000100
 #define A4XX_RB_FS_OUTPUT_SAMPLE_MASK__MASK                    0xffff0000
 #define A4XX_RB_FS_OUTPUT_SAMPLE_MASK__SHIFT                   16
 static inline uint32_t A4XX_RB_FS_OUTPUT_SAMPLE_MASK(uint32_t val)
@@ -641,6 +1221,7 @@ static inline uint32_t A4XX_RB_FS_OUTPUT_SAMPLE_MASK(uint32_t val)
 #define A4XX_RB_SAMPLE_COUNT_CONTROL_ADDR__SHIFT               2
 static inline uint32_t A4XX_RB_SAMPLE_COUNT_CONTROL_ADDR(uint32_t val)
 {
+       assert(!(val & 0x3));
        return ((val >> 2) << A4XX_RB_SAMPLE_COUNT_CONTROL_ADDR__SHIFT) & A4XX_RB_SAMPLE_COUNT_CONTROL_ADDR__MASK;
 }
 
@@ -717,6 +1298,7 @@ static inline uint32_t A4XX_RB_COPY_CONTROL_FASTCLEAR(uint32_t val)
 #define A4XX_RB_COPY_CONTROL_GMEM_BASE__SHIFT                  14
 static inline uint32_t A4XX_RB_COPY_CONTROL_GMEM_BASE(uint32_t val)
 {
+       assert(!(val & 0x3fff));
        return ((val >> 14) << A4XX_RB_COPY_CONTROL_GMEM_BASE__SHIFT) & A4XX_RB_COPY_CONTROL_GMEM_BASE__MASK;
 }
 
@@ -725,6 +1307,7 @@ static inline uint32_t A4XX_RB_COPY_CONTROL_GMEM_BASE(uint32_t val)
 #define A4XX_RB_COPY_DEST_BASE_BASE__SHIFT                     5
 static inline uint32_t A4XX_RB_COPY_DEST_BASE_BASE(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_COPY_DEST_BASE_BASE__SHIFT) & A4XX_RB_COPY_DEST_BASE_BASE__MASK;
 }
 
@@ -733,6 +1316,7 @@ static inline uint32_t A4XX_RB_COPY_DEST_BASE_BASE(uint32_t val)
 #define A4XX_RB_COPY_DEST_PITCH_PITCH__SHIFT                   0
 static inline uint32_t A4XX_RB_COPY_DEST_PITCH_PITCH(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_COPY_DEST_PITCH_PITCH__SHIFT) & A4XX_RB_COPY_DEST_PITCH_PITCH__MASK;
 }
 
@@ -793,8 +1377,9 @@ static inline uint32_t A4XX_RB_DEPTH_CONTROL_ZFUNC(enum adreno_compare_func val)
 {
        return ((val) << A4XX_RB_DEPTH_CONTROL_ZFUNC__SHIFT) & A4XX_RB_DEPTH_CONTROL_ZFUNC__MASK;
 }
-#define A4XX_RB_DEPTH_CONTROL_BF_ENABLE                                0x00000080
+#define A4XX_RB_DEPTH_CONTROL_Z_CLAMP_ENABLE                   0x00000080
 #define A4XX_RB_DEPTH_CONTROL_EARLY_Z_DISABLE                  0x00010000
+#define A4XX_RB_DEPTH_CONTROL_FORCE_FRAGZ_TO_FS                        0x00020000
 #define A4XX_RB_DEPTH_CONTROL_Z_TEST_ENABLE                    0x80000000
 
 #define REG_A4XX_RB_DEPTH_CLEAR                                        0x00002102
@@ -810,6 +1395,7 @@ static inline uint32_t A4XX_RB_DEPTH_INFO_DEPTH_FORMAT(enum a4xx_depth_format va
 #define A4XX_RB_DEPTH_INFO_DEPTH_BASE__SHIFT                   12
 static inline uint32_t A4XX_RB_DEPTH_INFO_DEPTH_BASE(uint32_t val)
 {
+       assert(!(val & 0xfff));
        return ((val >> 12) << A4XX_RB_DEPTH_INFO_DEPTH_BASE__SHIFT) & A4XX_RB_DEPTH_INFO_DEPTH_BASE__MASK;
 }
 
@@ -818,6 +1404,7 @@ static inline uint32_t A4XX_RB_DEPTH_INFO_DEPTH_BASE(uint32_t val)
 #define A4XX_RB_DEPTH_PITCH__SHIFT                             0
 static inline uint32_t A4XX_RB_DEPTH_PITCH(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_DEPTH_PITCH__SHIFT) & A4XX_RB_DEPTH_PITCH__MASK;
 }
 
@@ -826,6 +1413,7 @@ static inline uint32_t A4XX_RB_DEPTH_PITCH(uint32_t val)
 #define A4XX_RB_DEPTH_PITCH2__SHIFT                            0
 static inline uint32_t A4XX_RB_DEPTH_PITCH2(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_DEPTH_PITCH2__SHIFT) & A4XX_RB_DEPTH_PITCH2__MASK;
 }
 
@@ -891,6 +1479,7 @@ static inline uint32_t A4XX_RB_STENCIL_CONTROL_ZFAIL_BF(enum adreno_stencil_op v
 #define A4XX_RB_STENCIL_INFO_STENCIL_BASE__SHIFT               12
 static inline uint32_t A4XX_RB_STENCIL_INFO_STENCIL_BASE(uint32_t val)
 {
+       assert(!(val & 0xfff));
        return ((val >> 12) << A4XX_RB_STENCIL_INFO_STENCIL_BASE__SHIFT) & A4XX_RB_STENCIL_INFO_STENCIL_BASE__MASK;
 }
 
@@ -899,6 +1488,7 @@ static inline uint32_t A4XX_RB_STENCIL_INFO_STENCIL_BASE(uint32_t val)
 #define A4XX_RB_STENCIL_PITCH__SHIFT                           0
 static inline uint32_t A4XX_RB_STENCIL_PITCH(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_RB_STENCIL_PITCH__SHIFT) & A4XX_RB_STENCIL_PITCH__MASK;
 }
 
@@ -1055,8 +1645,386 @@ static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_TP_REG(uint32_t i0) { return 0x
 
 #define REG_A4XX_RBBM_CFG_DEBBUS_SEL_D                         0x0000004d
 
+#define REG_A4XX_RBBM_POWER_CNTL_IP                            0x00000098
+#define A4XX_RBBM_POWER_CNTL_IP_SW_COLLAPSE                    0x00000001
+#define A4XX_RBBM_POWER_CNTL_IP_SP_TP_PWR_ON                   0x00100000
+
 #define REG_A4XX_RBBM_PERFCTR_CP_0_LO                          0x0000009c
 
+#define REG_A4XX_RBBM_PERFCTR_CP_0_HI                          0x0000009d
+
+#define REG_A4XX_RBBM_PERFCTR_CP_1_LO                          0x0000009e
+
+#define REG_A4XX_RBBM_PERFCTR_CP_1_HI                          0x0000009f
+
+#define REG_A4XX_RBBM_PERFCTR_CP_2_LO                          0x000000a0
+
+#define REG_A4XX_RBBM_PERFCTR_CP_2_HI                          0x000000a1
+
+#define REG_A4XX_RBBM_PERFCTR_CP_3_LO                          0x000000a2
+
+#define REG_A4XX_RBBM_PERFCTR_CP_3_HI                          0x000000a3
+
+#define REG_A4XX_RBBM_PERFCTR_CP_4_LO                          0x000000a4
+
+#define REG_A4XX_RBBM_PERFCTR_CP_4_HI                          0x000000a5
+
+#define REG_A4XX_RBBM_PERFCTR_CP_5_LO                          0x000000a6
+
+#define REG_A4XX_RBBM_PERFCTR_CP_5_HI                          0x000000a7
+
+#define REG_A4XX_RBBM_PERFCTR_CP_6_LO                          0x000000a8
+
+#define REG_A4XX_RBBM_PERFCTR_CP_6_HI                          0x000000a9
+
+#define REG_A4XX_RBBM_PERFCTR_CP_7_LO                          0x000000aa
+
+#define REG_A4XX_RBBM_PERFCTR_CP_7_HI                          0x000000ab
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_0_LO                                0x000000ac
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_0_HI                                0x000000ad
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_1_LO                                0x000000ae
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_1_HI                                0x000000af
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_2_LO                                0x000000b0
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_2_HI                                0x000000b1
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_3_LO                                0x000000b2
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_3_HI                                0x000000b3
+
+#define REG_A4XX_RBBM_PERFCTR_PC_0_LO                          0x000000b4
+
+#define REG_A4XX_RBBM_PERFCTR_PC_0_HI                          0x000000b5
+
+#define REG_A4XX_RBBM_PERFCTR_PC_1_LO                          0x000000b6
+
+#define REG_A4XX_RBBM_PERFCTR_PC_1_HI                          0x000000b7
+
+#define REG_A4XX_RBBM_PERFCTR_PC_2_LO                          0x000000b8
+
+#define REG_A4XX_RBBM_PERFCTR_PC_2_HI                          0x000000b9
+
+#define REG_A4XX_RBBM_PERFCTR_PC_3_LO                          0x000000ba
+
+#define REG_A4XX_RBBM_PERFCTR_PC_3_HI                          0x000000bb
+
+#define REG_A4XX_RBBM_PERFCTR_PC_4_LO                          0x000000bc
+
+#define REG_A4XX_RBBM_PERFCTR_PC_4_HI                          0x000000bd
+
+#define REG_A4XX_RBBM_PERFCTR_PC_5_LO                          0x000000be
+
+#define REG_A4XX_RBBM_PERFCTR_PC_5_HI                          0x000000bf
+
+#define REG_A4XX_RBBM_PERFCTR_PC_6_LO                          0x000000c0
+
+#define REG_A4XX_RBBM_PERFCTR_PC_6_HI                          0x000000c1
+
+#define REG_A4XX_RBBM_PERFCTR_PC_7_LO                          0x000000c2
+
+#define REG_A4XX_RBBM_PERFCTR_PC_7_HI                          0x000000c3
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_0_LO                         0x000000c4
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_0_HI                         0x000000c5
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_1_LO                         0x000000c6
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_1_HI                         0x000000c7
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_2_LO                         0x000000c8
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_2_HI                         0x000000c9
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_3_LO                         0x000000ca
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_3_HI                         0x000000cb
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_4_LO                         0x000000cc
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_4_HI                         0x000000cd
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_5_LO                         0x000000ce
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_5_HI                         0x000000cf
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_6_LO                         0x000000d0
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_6_HI                         0x000000d1
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_7_LO                         0x000000d2
+
+#define REG_A4XX_RBBM_PERFCTR_VFD_7_HI                         0x000000d3
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_0_LO                                0x000000d4
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_0_HI                                0x000000d5
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_1_LO                                0x000000d6
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_1_HI                                0x000000d7
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_2_LO                                0x000000d8
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_2_HI                                0x000000d9
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_3_LO                                0x000000da
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_3_HI                                0x000000db
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_4_LO                                0x000000dc
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_4_HI                                0x000000dd
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_5_LO                                0x000000de
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_5_HI                                0x000000df
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_6_LO                                0x000000e0
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_6_HI                                0x000000e1
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_7_LO                                0x000000e2
+
+#define REG_A4XX_RBBM_PERFCTR_HLSQ_7_HI                                0x000000e3
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_0_LO                         0x000000e4
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_0_HI                         0x000000e5
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_1_LO                         0x000000e6
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_1_HI                         0x000000e7
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_2_LO                         0x000000e8
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_2_HI                         0x000000e9
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_3_LO                         0x000000ea
+
+#define REG_A4XX_RBBM_PERFCTR_VPC_3_HI                         0x000000eb
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_0_LO                         0x000000ec
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_0_HI                         0x000000ed
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_1_LO                         0x000000ee
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_1_HI                         0x000000ef
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_2_LO                         0x000000f0
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_2_HI                         0x000000f1
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_3_LO                         0x000000f2
+
+#define REG_A4XX_RBBM_PERFCTR_CCU_3_HI                         0x000000f3
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_0_LO                         0x000000f4
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_0_HI                         0x000000f5
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_1_LO                         0x000000f6
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_1_HI                         0x000000f7
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_2_LO                         0x000000f8
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_2_HI                         0x000000f9
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_3_LO                         0x000000fa
+
+#define REG_A4XX_RBBM_PERFCTR_TSE_3_HI                         0x000000fb
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_0_LO                         0x000000fc
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_0_HI                         0x000000fd
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_1_LO                         0x000000fe
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_1_HI                         0x000000ff
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_2_LO                         0x00000100
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_2_HI                         0x00000101
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_3_LO                         0x00000102
+
+#define REG_A4XX_RBBM_PERFCTR_RAS_3_HI                         0x00000103
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_0_LO                                0x00000104
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_0_HI                                0x00000105
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_1_LO                                0x00000106
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_1_HI                                0x00000107
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_2_LO                                0x00000108
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_2_HI                                0x00000109
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_3_LO                                0x0000010a
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_3_HI                                0x0000010b
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_4_LO                                0x0000010c
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_4_HI                                0x0000010d
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_5_LO                                0x0000010e
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_5_HI                                0x0000010f
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_6_LO                                0x00000110
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_6_HI                                0x00000111
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_7_LO                                0x00000112
+
+#define REG_A4XX_RBBM_PERFCTR_UCHE_7_HI                                0x00000113
+
+#define REG_A4XX_RBBM_PERFCTR_TP_0_LO                          0x00000114
+
+#define REG_A4XX_RBBM_PERFCTR_TP_0_HI                          0x00000115
+
+#define REG_A4XX_RBBM_PERFCTR_TP_0_LO                          0x00000114
+
+#define REG_A4XX_RBBM_PERFCTR_TP_0_HI                          0x00000115
+
+#define REG_A4XX_RBBM_PERFCTR_TP_1_LO                          0x00000116
+
+#define REG_A4XX_RBBM_PERFCTR_TP_1_HI                          0x00000117
+
+#define REG_A4XX_RBBM_PERFCTR_TP_2_LO                          0x00000118
+
+#define REG_A4XX_RBBM_PERFCTR_TP_2_HI                          0x00000119
+
+#define REG_A4XX_RBBM_PERFCTR_TP_3_LO                          0x0000011a
+
+#define REG_A4XX_RBBM_PERFCTR_TP_3_HI                          0x0000011b
+
+#define REG_A4XX_RBBM_PERFCTR_TP_4_LO                          0x0000011c
+
+#define REG_A4XX_RBBM_PERFCTR_TP_4_HI                          0x0000011d
+
+#define REG_A4XX_RBBM_PERFCTR_TP_5_LO                          0x0000011e
+
+#define REG_A4XX_RBBM_PERFCTR_TP_5_HI                          0x0000011f
+
+#define REG_A4XX_RBBM_PERFCTR_TP_6_LO                          0x00000120
+
+#define REG_A4XX_RBBM_PERFCTR_TP_6_HI                          0x00000121
+
+#define REG_A4XX_RBBM_PERFCTR_TP_7_LO                          0x00000122
+
+#define REG_A4XX_RBBM_PERFCTR_TP_7_HI                          0x00000123
+
+#define REG_A4XX_RBBM_PERFCTR_SP_0_LO                          0x00000124
+
+#define REG_A4XX_RBBM_PERFCTR_SP_0_HI                          0x00000125
+
+#define REG_A4XX_RBBM_PERFCTR_SP_1_LO                          0x00000126
+
+#define REG_A4XX_RBBM_PERFCTR_SP_1_HI                          0x00000127
+
+#define REG_A4XX_RBBM_PERFCTR_SP_2_LO                          0x00000128
+
+#define REG_A4XX_RBBM_PERFCTR_SP_2_HI                          0x00000129
+
+#define REG_A4XX_RBBM_PERFCTR_SP_3_LO                          0x0000012a
+
+#define REG_A4XX_RBBM_PERFCTR_SP_3_HI                          0x0000012b
+
+#define REG_A4XX_RBBM_PERFCTR_SP_4_LO                          0x0000012c
+
+#define REG_A4XX_RBBM_PERFCTR_SP_4_HI                          0x0000012d
+
+#define REG_A4XX_RBBM_PERFCTR_SP_5_LO                          0x0000012e
+
+#define REG_A4XX_RBBM_PERFCTR_SP_5_HI                          0x0000012f
+
+#define REG_A4XX_RBBM_PERFCTR_SP_6_LO                          0x00000130
+
+#define REG_A4XX_RBBM_PERFCTR_SP_6_HI                          0x00000131
+
+#define REG_A4XX_RBBM_PERFCTR_SP_7_LO                          0x00000132
+
+#define REG_A4XX_RBBM_PERFCTR_SP_7_HI                          0x00000133
+
+#define REG_A4XX_RBBM_PERFCTR_SP_8_LO                          0x00000134
+
+#define REG_A4XX_RBBM_PERFCTR_SP_8_HI                          0x00000135
+
+#define REG_A4XX_RBBM_PERFCTR_SP_9_LO                          0x00000136
+
+#define REG_A4XX_RBBM_PERFCTR_SP_9_HI                          0x00000137
+
+#define REG_A4XX_RBBM_PERFCTR_SP_10_LO                         0x00000138
+
+#define REG_A4XX_RBBM_PERFCTR_SP_10_HI                         0x00000139
+
+#define REG_A4XX_RBBM_PERFCTR_SP_11_LO                         0x0000013a
+
+#define REG_A4XX_RBBM_PERFCTR_SP_11_HI                         0x0000013b
+
+#define REG_A4XX_RBBM_PERFCTR_RB_0_LO                          0x0000013c
+
+#define REG_A4XX_RBBM_PERFCTR_RB_0_HI                          0x0000013d
+
+#define REG_A4XX_RBBM_PERFCTR_RB_1_LO                          0x0000013e
+
+#define REG_A4XX_RBBM_PERFCTR_RB_1_HI                          0x0000013f
+
+#define REG_A4XX_RBBM_PERFCTR_RB_2_LO                          0x00000140
+
+#define REG_A4XX_RBBM_PERFCTR_RB_2_HI                          0x00000141
+
+#define REG_A4XX_RBBM_PERFCTR_RB_3_LO                          0x00000142
+
+#define REG_A4XX_RBBM_PERFCTR_RB_3_HI                          0x00000143
+
+#define REG_A4XX_RBBM_PERFCTR_RB_4_LO                          0x00000144
+
+#define REG_A4XX_RBBM_PERFCTR_RB_4_HI                          0x00000145
+
+#define REG_A4XX_RBBM_PERFCTR_RB_5_LO                          0x00000146
+
+#define REG_A4XX_RBBM_PERFCTR_RB_5_HI                          0x00000147
+
+#define REG_A4XX_RBBM_PERFCTR_RB_6_LO                          0x00000148
+
+#define REG_A4XX_RBBM_PERFCTR_RB_6_HI                          0x00000149
+
+#define REG_A4XX_RBBM_PERFCTR_RB_7_LO                          0x0000014a
+
+#define REG_A4XX_RBBM_PERFCTR_RB_7_HI                          0x0000014b
+
+#define REG_A4XX_RBBM_PERFCTR_VSC_0_LO                         0x0000014c
+
+#define REG_A4XX_RBBM_PERFCTR_VSC_0_HI                         0x0000014d
+
+#define REG_A4XX_RBBM_PERFCTR_VSC_1_LO                         0x0000014e
+
+#define REG_A4XX_RBBM_PERFCTR_VSC_1_HI                         0x0000014f
+
+#define REG_A4XX_RBBM_PERFCTR_PWR_0_LO                         0x00000166
+
+#define REG_A4XX_RBBM_PERFCTR_PWR_0_HI                         0x00000167
+
+#define REG_A4XX_RBBM_PERFCTR_PWR_1_LO                         0x00000168
+
+#define REG_A4XX_RBBM_PERFCTR_PWR_1_HI                         0x00000169
+
+#define REG_A4XX_RBBM_ALWAYSON_COUNTER_LO                      0x0000016e
+
+#define REG_A4XX_RBBM_ALWAYSON_COUNTER_HI                      0x0000016f
+
 static inline uint32_t REG_A4XX_RBBM_CLOCK_CTL_SP(uint32_t i0) { return 0x00000068 + 0x1*i0; }
 
 static inline uint32_t REG_A4XX_RBBM_CLOCK_CTL_SP_REG(uint32_t i0) { return 0x00000068 + 0x1*i0; }
@@ -1105,6 +2073,10 @@ static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_RB_MARB_CCU_L1(uint32_t i0) { r
 
 static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_RB_MARB_CCU_L1_REG(uint32_t i0) { return 0x0000008e + 0x1*i0; }
 
+#define REG_A4XX_RBBM_SP_REGFILE_SLEEP_CNTL_0                  0x00000099
+
+#define REG_A4XX_RBBM_SP_REGFILE_SLEEP_CNTL_1                  0x0000009a
+
 #define REG_A4XX_RBBM_PERFCTR_PWR_1_LO                         0x00000168
 
 #define REG_A4XX_RBBM_PERFCTR_CTL                              0x00000170
@@ -1119,6 +2091,14 @@ static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_RB_MARB_CCU_L1_REG(uint32_t i0)
 
 #define REG_A4XX_RBBM_PERFCTR_LOAD_VALUE_HI                    0x00000175
 
+#define REG_A4XX_RBBM_PERFCTR_RBBM_SEL_0                       0x00000176
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_SEL_1                       0x00000177
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_SEL_2                       0x00000178
+
+#define REG_A4XX_RBBM_PERFCTR_RBBM_SEL_3                       0x00000179
+
 #define REG_A4XX_RBBM_GPU_BUSY_MASKED                          0x0000017a
 
 #define REG_A4XX_RBBM_INT_0_STATUS                             0x0000017d
@@ -1158,6 +2138,11 @@ static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_RB_MARB_CCU_L1_REG(uint32_t i0)
 
 #define REG_A4XX_RBBM_INTERFACE_RRDY_STATUS5                   0x0000019f
 
+#define REG_A4XX_RBBM_POWER_STATUS                             0x000001b0
+#define A4XX_RBBM_POWER_STATUS_SP_TP_PWR_ON                    0x00100000
+
+#define REG_A4XX_RBBM_WAIT_IDLE_CLOCKS_CTL2                    0x000001b8
+
 #define REG_A4XX_CP_SCRATCH_UMASK                              0x00000228
 
 #define REG_A4XX_CP_SCRATCH_ADDR                               0x00000229
@@ -1226,11 +2211,23 @@ static inline uint32_t REG_A4XX_RBBM_CLOCK_DELAY_RB_MARB_CCU_L1_REG(uint32_t i0)
 
 #define REG_A4XX_CP_DRAW_STATE_ADDR                            0x00000232
 
-#define REG_A4XX_CP_PROTECT_REG_0                              0x00000240
-
 static inline uint32_t REG_A4XX_CP_PROTECT(uint32_t i0) { return 0x00000240 + 0x1*i0; }
 
 static inline uint32_t REG_A4XX_CP_PROTECT_REG(uint32_t i0) { return 0x00000240 + 0x1*i0; }
+#define A4XX_CP_PROTECT_REG_BASE_ADDR__MASK                    0x0001ffff
+#define A4XX_CP_PROTECT_REG_BASE_ADDR__SHIFT                   0
+static inline uint32_t A4XX_CP_PROTECT_REG_BASE_ADDR(uint32_t val)
+{
+       return ((val) << A4XX_CP_PROTECT_REG_BASE_ADDR__SHIFT) & A4XX_CP_PROTECT_REG_BASE_ADDR__MASK;
+}
+#define A4XX_CP_PROTECT_REG_MASK_LEN__MASK                     0x1f000000
+#define A4XX_CP_PROTECT_REG_MASK_LEN__SHIFT                    24
+static inline uint32_t A4XX_CP_PROTECT_REG_MASK_LEN(uint32_t val)
+{
+       return ((val) << A4XX_CP_PROTECT_REG_MASK_LEN__SHIFT) & A4XX_CP_PROTECT_REG_MASK_LEN__MASK;
+}
+#define A4XX_CP_PROTECT_REG_TRAP_WRITE                         0x20000000
+#define A4XX_CP_PROTECT_REG_TRAP_READ                          0x40000000
 
 #define REG_A4XX_CP_PROTECT_CTRL                               0x00000250
 
@@ -1250,6 +2247,20 @@ static inline uint32_t REG_A4XX_CP_PROTECT_REG(uint32_t i0) { return 0x00000240
 
 #define REG_A4XX_CP_PERFCTR_CP_SEL_0                           0x00000500
 
+#define REG_A4XX_CP_PERFCTR_CP_SEL_1                           0x00000501
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_2                           0x00000502
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_3                           0x00000503
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_4                           0x00000504
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_5                           0x00000505
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_6                           0x00000506
+
+#define REG_A4XX_CP_PERFCTR_CP_SEL_7                           0x00000507
+
 #define REG_A4XX_CP_PERFCOMBINER_SELECT                                0x0000050b
 
 static inline uint32_t REG_A4XX_CP_SCRATCH(uint32_t i0) { return 0x00000578 + 0x1*i0; }
@@ -1260,6 +2271,28 @@ static inline uint32_t REG_A4XX_CP_SCRATCH_REG(uint32_t i0) { return 0x00000578
 
 #define REG_A4XX_SP_MODE_CONTROL                               0x00000ec3
 
+#define REG_A4XX_SP_PERFCTR_SP_SEL_0                           0x00000ec4
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_1                           0x00000ec5
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_2                           0x00000ec6
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_3                           0x00000ec7
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_4                           0x00000ec8
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_5                           0x00000ec9
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_6                           0x00000eca
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_7                           0x00000ecb
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_8                           0x00000ecc
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_9                           0x00000ecd
+
+#define REG_A4XX_SP_PERFCTR_SP_SEL_10                          0x00000ece
+
 #define REG_A4XX_SP_PERFCTR_SP_SEL_11                          0x00000ecf
 
 #define REG_A4XX_SP_SP_CTRL_REG                                        0x000022c0
@@ -1285,7 +2318,7 @@ static inline uint32_t A4XX_SP_VS_CTRL_REG0_HALFREGFOOTPRINT(uint32_t val)
 {
        return ((val) << A4XX_SP_VS_CTRL_REG0_HALFREGFOOTPRINT__SHIFT) & A4XX_SP_VS_CTRL_REG0_HALFREGFOOTPRINT__MASK;
 }
-#define A4XX_SP_VS_CTRL_REG0_FULLREGFOOTPRINT__MASK            0x0003fc00
+#define A4XX_SP_VS_CTRL_REG0_FULLREGFOOTPRINT__MASK            0x0000fc00
 #define A4XX_SP_VS_CTRL_REG0_FULLREGFOOTPRINT__SHIFT           10
 static inline uint32_t A4XX_SP_VS_CTRL_REG0_FULLREGFOOTPRINT(uint32_t val)
 {
@@ -1433,7 +2466,7 @@ static inline uint32_t A4XX_SP_FS_CTRL_REG0_HALFREGFOOTPRINT(uint32_t val)
 {
        return ((val) << A4XX_SP_FS_CTRL_REG0_HALFREGFOOTPRINT__SHIFT) & A4XX_SP_FS_CTRL_REG0_HALFREGFOOTPRINT__MASK;
 }
-#define A4XX_SP_FS_CTRL_REG0_FULLREGFOOTPRINT__MASK            0x0003fc00
+#define A4XX_SP_FS_CTRL_REG0_FULLREGFOOTPRINT__MASK            0x0000fc00
 #define A4XX_SP_FS_CTRL_REG0_FULLREGFOOTPRINT__SHIFT           10
 static inline uint32_t A4XX_SP_FS_CTRL_REG0_FULLREGFOOTPRINT(uint32_t val)
 {
@@ -1758,6 +2791,12 @@ static inline uint32_t A4XX_SP_GS_OBJ_OFFSET_REG_SHADEROBJOFFSET(uint32_t val)
 
 #define REG_A4XX_VPC_DEBUG_ECO_CONTROL                         0x00000e64
 
+#define REG_A4XX_VPC_PERFCTR_VPC_SEL_0                         0x00000e65
+
+#define REG_A4XX_VPC_PERFCTR_VPC_SEL_1                         0x00000e66
+
+#define REG_A4XX_VPC_PERFCTR_VPC_SEL_2                         0x00000e67
+
 #define REG_A4XX_VPC_PERFCTR_VPC_SEL_3                         0x00000e68
 
 #define REG_A4XX_VPC_ATTR                                      0x00002140
@@ -1811,12 +2850,14 @@ static inline uint32_t REG_A4XX_VPC_VARYING_PS_REPL_MODE(uint32_t i0) { return 0
 #define A4XX_VSC_BIN_SIZE_WIDTH__SHIFT                         0
 static inline uint32_t A4XX_VSC_BIN_SIZE_WIDTH(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_VSC_BIN_SIZE_WIDTH__SHIFT) & A4XX_VSC_BIN_SIZE_WIDTH__MASK;
 }
 #define A4XX_VSC_BIN_SIZE_HEIGHT__MASK                         0x000003e0
 #define A4XX_VSC_BIN_SIZE_HEIGHT__SHIFT                                5
 static inline uint32_t A4XX_VSC_BIN_SIZE_HEIGHT(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_VSC_BIN_SIZE_HEIGHT__SHIFT) & A4XX_VSC_BIN_SIZE_HEIGHT__MASK;
 }
 
@@ -1870,6 +2911,20 @@ static inline uint32_t REG_A4XX_VSC_PIPE_DATA_LENGTH_REG(uint32_t i0) { return 0
 
 #define REG_A4XX_VFD_DEBUG_CONTROL                             0x00000e40
 
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_0                         0x00000e43
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_1                         0x00000e44
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_2                         0x00000e45
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_3                         0x00000e46
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_4                         0x00000e47
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_5                         0x00000e48
+
+#define REG_A4XX_VFD_PERFCTR_VFD_SEL_6                         0x00000e49
+
 #define REG_A4XX_VFD_PERFCTR_VFD_SEL_7                         0x00000e4a
 
 #define REG_A4XX_VGT_CL_INITIATOR                              0x000021d0
@@ -1969,11 +3024,11 @@ static inline uint32_t A4XX_VFD_FETCH_INSTR_0_BUFSTRIDE(uint32_t val)
 static inline uint32_t REG_A4XX_VFD_FETCH_INSTR_1(uint32_t i0) { return 0x0000220b + 0x4*i0; }
 
 static inline uint32_t REG_A4XX_VFD_FETCH_INSTR_2(uint32_t i0) { return 0x0000220c + 0x4*i0; }
-#define A4XX_VFD_FETCH_INSTR_2_SIZE__MASK                      0xfffffff0
-#define A4XX_VFD_FETCH_INSTR_2_SIZE__SHIFT                     4
+#define A4XX_VFD_FETCH_INSTR_2_SIZE__MASK                      0xffffffff
+#define A4XX_VFD_FETCH_INSTR_2_SIZE__SHIFT                     0
 static inline uint32_t A4XX_VFD_FETCH_INSTR_2_SIZE(uint32_t val)
 {
-       return ((val >> 4) << A4XX_VFD_FETCH_INSTR_2_SIZE__SHIFT) & A4XX_VFD_FETCH_INSTR_2_SIZE__MASK;
+       return ((val) << A4XX_VFD_FETCH_INSTR_2_SIZE__SHIFT) & A4XX_VFD_FETCH_INSTR_2_SIZE__MASK;
 }
 
 static inline uint32_t REG_A4XX_VFD_FETCH_INSTR_3(uint32_t i0) { return 0x0000220d + 0x4*i0; }
@@ -2026,6 +3081,20 @@ static inline uint32_t A4XX_VFD_DECODE_INSTR_SHIFTCNT(uint32_t val)
 
 #define REG_A4XX_TPL1_TP_MODE_CONTROL                          0x00000f03
 
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_0                         0x00000f04
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_1                         0x00000f05
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_2                         0x00000f06
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_3                         0x00000f07
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_4                         0x00000f08
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_5                         0x00000f09
+
+#define REG_A4XX_TPL1_PERFCTR_TP_SEL_6                         0x00000f0a
+
 #define REG_A4XX_TPL1_PERFCTR_TP_SEL_7                         0x00000f0b
 
 #define REG_A4XX_TPL1_TP_TEX_OFFSET                            0x00002380
@@ -2080,10 +3149,24 @@ static inline uint32_t A4XX_TPL1_TP_TEX_COUNT_GS(uint32_t val)
 
 #define REG_A4XX_GRAS_PERFCTR_TSE_SEL_0                                0x00000c88
 
+#define REG_A4XX_GRAS_PERFCTR_TSE_SEL_1                                0x00000c89
+
+#define REG_A4XX_GRAS_PERFCTR_TSE_SEL_2                                0x00000c8a
+
 #define REG_A4XX_GRAS_PERFCTR_TSE_SEL_3                                0x00000c8b
 
+#define REG_A4XX_GRAS_PERFCTR_RAS_SEL_0                                0x00000c8c
+
+#define REG_A4XX_GRAS_PERFCTR_RAS_SEL_1                                0x00000c8d
+
+#define REG_A4XX_GRAS_PERFCTR_RAS_SEL_2                                0x00000c8e
+
+#define REG_A4XX_GRAS_PERFCTR_RAS_SEL_3                                0x00000c8f
+
 #define REG_A4XX_GRAS_CL_CLIP_CNTL                             0x00002000
 #define A4XX_GRAS_CL_CLIP_CNTL_CLIP_DISABLE                    0x00008000
+#define A4XX_GRAS_CL_CLIP_CNTL_ZNEAR_CLIP_DISABLE              0x00010000
+#define A4XX_GRAS_CL_CLIP_CNTL_ZFAR_CLIP_DISABLE               0x00020000
 #define A4XX_GRAS_CL_CLIP_CNTL_ZERO_GB_SCALE_Z                 0x00400000
 
 #define REG_A4XX_GRAS_CLEAR_CNTL                               0x00002003
@@ -2175,6 +3258,7 @@ static inline uint32_t A4XX_GRAS_SU_POINT_SIZE(float val)
 
 #define REG_A4XX_GRAS_ALPHA_CONTROL                            0x00002073
 #define A4XX_GRAS_ALPHA_CONTROL_ALPHA_TEST_ENABLE              0x00000004
+#define A4XX_GRAS_ALPHA_CONTROL_FORCE_FRAGZ_TO_FS              0x00000008
 
 #define REG_A4XX_GRAS_SU_POLY_OFFSET_SCALE                     0x00002074
 #define A4XX_GRAS_SU_POLY_OFFSET_SCALE__MASK                   0xffffffff
@@ -2219,6 +3303,7 @@ static inline uint32_t A4XX_GRAS_SU_MODE_CONTROL_LINEHALFWIDTH(float val)
        return ((((int32_t)(val * 4.0))) << A4XX_GRAS_SU_MODE_CONTROL_LINEHALFWIDTH__SHIFT) & A4XX_GRAS_SU_MODE_CONTROL_LINEHALFWIDTH__MASK;
 }
 #define A4XX_GRAS_SU_MODE_CONTROL_POLY_OFFSET                  0x00000800
+#define A4XX_GRAS_SU_MODE_CONTROL_MSAA_ENABLE                  0x00002000
 #define A4XX_GRAS_SU_MODE_CONTROL_RENDERING_PASS               0x00100000
 
 #define REG_A4XX_GRAS_SC_CONTROL                               0x0000207b
@@ -2346,6 +3431,20 @@ static inline uint32_t A4XX_GRAS_SC_EXTENT_WINDOW_TL_Y(uint32_t val)
 
 #define REG_A4XX_UCHE_CACHE_WAYS_VFD                           0x00000e8c
 
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_0                       0x00000e8e
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_1                       0x00000e8f
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_2                       0x00000e90
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_3                       0x00000e91
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_4                       0x00000e92
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_5                       0x00000e93
+
+#define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_6                       0x00000e94
+
 #define REG_A4XX_UCHE_PERFCTR_UCHE_SEL_7                       0x00000e95
 
 #define REG_A4XX_HLSQ_TIMEOUT_THRESHOLD                                0x00000e00
@@ -2356,6 +3455,22 @@ static inline uint32_t A4XX_GRAS_SC_EXTENT_WINDOW_TL_Y(uint32_t val)
 
 #define REG_A4XX_HLSQ_PERF_PIPE_MASK                           0x00000e0e
 
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_0                       0x00000e06
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_1                       0x00000e07
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_2                       0x00000e08
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_3                       0x00000e09
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_4                       0x00000e0a
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_5                       0x00000e0b
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_6                       0x00000e0c
+
+#define REG_A4XX_HLSQ_PERFCTR_HLSQ_SEL_7                       0x00000e0d
+
 #define REG_A4XX_HLSQ_CONTROL_0_REG                            0x000023c0
 #define A4XX_HLSQ_CONTROL_0_REG_FSTHREADSIZE__MASK             0x00000010
 #define A4XX_HLSQ_CONTROL_0_REG_FSTHREADSIZE__SHIFT            4
@@ -2606,14 +3721,42 @@ static inline uint32_t A4XX_HLSQ_GS_CONTROL_REG_INSTRLENGTH(uint32_t val)
 #define REG_A4XX_PC_BINNING_COMMAND                            0x00000d00
 #define A4XX_PC_BINNING_COMMAND_BINNING_ENABLE                 0x00000001
 
+#define REG_A4XX_PC_TESSFACTOR_ADDR                            0x00000d08
+
 #define REG_A4XX_PC_DRAWCALL_SETUP_OVERRIDE                    0x00000d0c
 
 #define REG_A4XX_PC_PERFCTR_PC_SEL_0                           0x00000d10
 
+#define REG_A4XX_PC_PERFCTR_PC_SEL_1                           0x00000d11
+
+#define REG_A4XX_PC_PERFCTR_PC_SEL_2                           0x00000d12
+
+#define REG_A4XX_PC_PERFCTR_PC_SEL_3                           0x00000d13
+
+#define REG_A4XX_PC_PERFCTR_PC_SEL_4                           0x00000d14
+
+#define REG_A4XX_PC_PERFCTR_PC_SEL_5                           0x00000d15
+
+#define REG_A4XX_PC_PERFCTR_PC_SEL_6                           0x00000d16
+
 #define REG_A4XX_PC_PERFCTR_PC_SEL_7                           0x00000d17
 
 #define REG_A4XX_PC_BIN_BASE                                   0x000021c0
 
+#define REG_A4XX_PC_VSTREAM_CONTROL                            0x000021c2
+#define A4XX_PC_VSTREAM_CONTROL_SIZE__MASK                     0x003f0000
+#define A4XX_PC_VSTREAM_CONTROL_SIZE__SHIFT                    16
+static inline uint32_t A4XX_PC_VSTREAM_CONTROL_SIZE(uint32_t val)
+{
+       return ((val) << A4XX_PC_VSTREAM_CONTROL_SIZE__SHIFT) & A4XX_PC_VSTREAM_CONTROL_SIZE__MASK;
+}
+#define A4XX_PC_VSTREAM_CONTROL_N__MASK                                0x07c00000
+#define A4XX_PC_VSTREAM_CONTROL_N__SHIFT                       22
+static inline uint32_t A4XX_PC_VSTREAM_CONTROL_N(uint32_t val)
+{
+       return ((val) << A4XX_PC_VSTREAM_CONTROL_N__SHIFT) & A4XX_PC_VSTREAM_CONTROL_N__MASK;
+}
+
 #define REG_A4XX_PC_PRIM_VTX_CNTL                              0x000021c4
 #define A4XX_PC_PRIM_VTX_CNTL_VAROUT__MASK                     0x0000000f
 #define A4XX_PC_PRIM_VTX_CNTL_VAROUT__SHIFT                    0
@@ -2625,7 +3768,20 @@ static inline uint32_t A4XX_PC_PRIM_VTX_CNTL_VAROUT(uint32_t val)
 #define A4XX_PC_PRIM_VTX_CNTL_PROVOKING_VTX_LAST               0x02000000
 #define A4XX_PC_PRIM_VTX_CNTL_PSIZE                            0x04000000
 
-#define REG_A4XX_UNKNOWN_21C5                                  0x000021c5
+#define REG_A4XX_PC_PRIM_VTX_CNTL2                             0x000021c5
+#define A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_FRONT_PTYPE__MASK      0x00000007
+#define A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_FRONT_PTYPE__SHIFT     0
+static inline uint32_t A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_FRONT_PTYPE(enum adreno_pa_su_sc_draw val)
+{
+       return ((val) << A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_FRONT_PTYPE__SHIFT) & A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_FRONT_PTYPE__MASK;
+}
+#define A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_BACK_PTYPE__MASK       0x00000038
+#define A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_BACK_PTYPE__SHIFT      3
+static inline uint32_t A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_BACK_PTYPE(enum adreno_pa_su_sc_draw val)
+{
+       return ((val) << A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_BACK_PTYPE__SHIFT) & A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_BACK_PTYPE__MASK;
+}
+#define A4XX_PC_PRIM_VTX_CNTL2_POLYMODE_ENABLE                 0x00000040
 
 #define REG_A4XX_PC_RESTART_INDEX                              0x000021c6
 
@@ -2663,12 +3819,8 @@ static inline uint32_t A4XX_PC_HS_PARAM_SPACING(enum a4xx_tess_spacing val)
 {
        return ((val) << A4XX_PC_HS_PARAM_SPACING__SHIFT) & A4XX_PC_HS_PARAM_SPACING__MASK;
 }
-#define A4XX_PC_HS_PARAM_PRIMTYPE__MASK                                0x01800000
-#define A4XX_PC_HS_PARAM_PRIMTYPE__SHIFT                       23
-static inline uint32_t A4XX_PC_HS_PARAM_PRIMTYPE(enum adreno_pa_su_sc_draw val)
-{
-       return ((val) << A4XX_PC_HS_PARAM_PRIMTYPE__SHIFT) & A4XX_PC_HS_PARAM_PRIMTYPE__MASK;
-}
+#define A4XX_PC_HS_PARAM_CW                                    0x00800000
+#define A4XX_PC_HS_PARAM_CONNECTED                             0x01000000
 
 #define REG_A4XX_VBIF_VERSION                                  0x00003000
 
@@ -2850,7 +4002,7 @@ static inline uint32_t A4XX_TEX_CONST_1_HEIGHT(uint32_t val)
 {
        return ((val) << A4XX_TEX_CONST_1_HEIGHT__SHIFT) & A4XX_TEX_CONST_1_HEIGHT__MASK;
 }
-#define A4XX_TEX_CONST_1_WIDTH__MASK                           0x1fff8000
+#define A4XX_TEX_CONST_1_WIDTH__MASK                           0x3fff8000
 #define A4XX_TEX_CONST_1_WIDTH__SHIFT                          15
 static inline uint32_t A4XX_TEX_CONST_1_WIDTH(uint32_t val)
 {
@@ -2882,6 +4034,7 @@ static inline uint32_t A4XX_TEX_CONST_2_SWAP(enum a3xx_color_swap val)
 #define A4XX_TEX_CONST_3_LAYERSZ__SHIFT                                0
 static inline uint32_t A4XX_TEX_CONST_3_LAYERSZ(uint32_t val)
 {
+       assert(!(val & 0xfff));
        return ((val >> 12) << A4XX_TEX_CONST_3_LAYERSZ__SHIFT) & A4XX_TEX_CONST_3_LAYERSZ__MASK;
 }
 #define A4XX_TEX_CONST_3_DEPTH__MASK                           0x7ffc0000
@@ -2896,12 +4049,14 @@ static inline uint32_t A4XX_TEX_CONST_3_DEPTH(uint32_t val)
 #define A4XX_TEX_CONST_4_LAYERSZ__SHIFT                                0
 static inline uint32_t A4XX_TEX_CONST_4_LAYERSZ(uint32_t val)
 {
+       assert(!(val & 0xfff));
        return ((val >> 12) << A4XX_TEX_CONST_4_LAYERSZ__SHIFT) & A4XX_TEX_CONST_4_LAYERSZ__MASK;
 }
 #define A4XX_TEX_CONST_4_BASE__MASK                            0xffffffe0
 #define A4XX_TEX_CONST_4_BASE__SHIFT                           5
 static inline uint32_t A4XX_TEX_CONST_4_BASE(uint32_t val)
 {
+       assert(!(val & 0x1f));
        return ((val >> 5) << A4XX_TEX_CONST_4_BASE__SHIFT) & A4XX_TEX_CONST_4_BASE__MASK;
 }