From 277f37d036159d373ec9726fe00148d5e49da875 Mon Sep 17 00:00:00 2001
From: =?utf8?q?Timur=20Krist=C3=B3f?=
Date: Thu, 23 Apr 2020 15:50:56 +0200
Subject: [PATCH] aco: Use 24-bit multiplication for NGG wave id and thread id.
MIME-Version: 1.0
Content-Type: text/plain; charset=utf8
Content-Transfer-Encoding: 8bit

Both of them should always fit 24 bits anyway.

Signed-off-by: Timur Kristóf
Reviewed-by: Rhys Perry
Part-of:
---
 src/amd/compiler/aco_instruction_selection.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/amd/compiler/aco_instruction_selection.cpp b/src/amd/compiler/aco_instruction_selection.cpp
index 2dc9fc64ea3..bca192d7564 100644
--- a/src/amd/compiler/aco_instruction_selection.cpp
+++ b/src/amd/compiler/aco_instruction_selection.cpp
@@ -10614,9 +10614,9 @@ void ngg_emit_nogs_output(isel_context *ctx)
          Temp wave_id_in_tg = bld.sop2(aco_opcode::s_bfe_u32, bld.def(s1), bld.def(s1, scc),
                                        get_arg(ctx, ctx->args->merged_wave_info), Operand(24u | (4u << 16)));
          Temp thread_id_in_wave = emit_mbcnt(ctx, bld.def(v1));
-         Temp wave_id_mul = bld.v_mul_imm(bld.def(v1), as_vgpr(ctx, wave_id_in_tg), ctx->program->wave_size);
+         Temp wave_id_mul = bld.v_mul24_imm(bld.def(v1), as_vgpr(ctx, wave_id_in_tg), ctx->program->wave_size);
          Temp thread_id_in_tg = bld.vadd32(bld.def(v1), Operand(wave_id_mul), Operand(thread_id_in_wave));
-         Temp addr = bld.v_mul_imm(bld.def(v1), thread_id_in_tg, 4u);
+         Temp addr = bld.v_mul24_imm(bld.def(v1), thread_id_in_tg, 4u);
 
          /* Load primitive ID from LDS. */
          prim_id = load_lds(ctx, 4, bld.tmp(v1), addr, 0u, 4u);
-- 
2.30.2