From e73a8a9703b3be23ece12c1092185926522b6c4d Mon Sep 17 00:00:00 2001 From: Rob Clark Date: Mon, 16 Mar 2020 06:47:05 -0700 Subject: [PATCH] freedreno/ir3/cf: handle widening too We can also fold f16->f32 conversions. Signed-off-by: Rob Clark Part-of: --- src/freedreno/ir3/ir3_cf.c | 38 ++++++++++++++++++++++++++++++++------ 1 file changed, 32 insertions(+), 6 deletions(-) diff --git a/src/freedreno/ir3/ir3_cf.c b/src/freedreno/ir3/ir3_cf.c index 2c2dc06c27a..636ed384d79 100644 --- a/src/freedreno/ir3/ir3_cf.c +++ b/src/freedreno/ir3/ir3_cf.c @@ -26,11 +26,26 @@ static bool is_fp16_conv(struct ir3_instruction *instr) { - if (instr->opc == OPC_MOV && - instr->cat1.src_type == TYPE_F32 && + if (instr->opc != OPC_MOV) + return false; + + struct ir3_register *dst = instr->regs[0]; + struct ir3_register *src = instr->regs[1]; + + /* disallow conversions that cannot be folded into + * alu instructions: + */ + if (dst->flags & (IR3_REG_EVEN | IR3_REG_POS_INF)) + return false; + + if (instr->cat1.src_type == TYPE_F32 && instr->cat1.dst_type == TYPE_F16) return true; + if (instr->cat1.src_type == TYPE_F16 && + instr->cat1.dst_type == TYPE_F32) + return true; + return false; } @@ -77,8 +92,15 @@ try_conversion_folding(struct ir3 *ir, struct ir3_instruction *conv) if (!is_alu(src)) return; + /* avoid folding f2f32(f2f16) together, in cases where this is legal to + * do (glsl) nir should have handled that for us already: + */ + if (is_fp16_conv(src)) + return; + switch (src->opc) { case OPC_SEL_B32: + case OPC_SEL_B16: case OPC_MAX_F: case OPC_MIN_F: case OPC_SIGN_F: @@ -97,18 +119,22 @@ try_conversion_folding(struct ir3 *ir, struct ir3_instruction *conv) * change the dst type to F32 to get the right behavior, since we * could be moving a float with a u32.u32 move. */ - src->cat1.dst_type = TYPE_F16; - src->cat1.src_type = TYPE_F32; + src->cat1.dst_type = conv->cat1.dst_type; + src->cat1.src_type = conv->cat1.src_type; } else { /* Otherwise, for typechanging movs, we can just change the dst * type to F16 to collaps the two conversions. For example * cov.s32f32 follwed by cov.f32f16 becomes cov.s32f16. */ - src->cat1.dst_type = TYPE_F16; + src->cat1.dst_type = conv->cat1.dst_type; } } - src->regs[0]->flags |= IR3_REG_HALF; + if (conv->regs[0]->flags & IR3_REG_HALF) { + src->regs[0]->flags |= IR3_REG_HALF; + } else { + src->regs[0]->flags &= ~IR3_REG_HALF; + } rewrite_uses(ir, conv, src); } -- 2.30.2