freedreno/ir3: Support 16-bit comparison instructions
authorNeil Roberts <nroberts@igalia.com>
Wed, 30 Jan 2019 15:33:05 +0000 (16:33 +0100)
committerNeil Roberts <nroberts@igalia.com>
Wed, 20 Nov 2019 13:09:43 +0000 (14:09 +0100)
v2. [Hyunjun Ko (zzoon@igalia.com)]
Avoid using too much open code like "instr->regs[n]->flags |= FOO"

v3. [Hyunjun Ko (zzoon@igalia.com)]
Remove redundant code for both 16b and 32b operations.

Reviewed-by: Rob Clark <robdclark@gmail.com>
src/freedreno/ir3/ir3_compiler_nir.c

index 5e9eb9d1c3e1ac6f51318a07f39759550f774ea9..a960f0258ca49a307df7d6e2d6b546831288b604 100644 (file)
@@ -461,18 +461,22 @@ emit_alu(struct ir3_context *ctx, nir_alu_instr *alu)
                dst[0]->cat5.type = TYPE_F32;
                break;
                break;
+       case nir_op_flt16:
        case nir_op_flt32:
                dst[0] = ir3_CMPS_F(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_LT;
                break;
+       case nir_op_fge16:
        case nir_op_fge32:
                dst[0] = ir3_CMPS_F(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_GE;
                break;
+       case nir_op_feq16:
        case nir_op_feq32:
                dst[0] = ir3_CMPS_F(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_EQ;
                break;
+       case nir_op_fne16:
        case nir_op_fne32:
                dst[0] = ir3_CMPS_F(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_NE;
@@ -572,26 +576,32 @@ emit_alu(struct ir3_context *ctx, nir_alu_instr *alu)
        case nir_op_ushr:
                dst[0] = ir3_SHR_B(b, src[0], 0, src[1], 0);
                break;
+       case nir_op_ilt16:
        case nir_op_ilt32:
                dst[0] = ir3_CMPS_S(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_LT;
                break;
+       case nir_op_ige16:
        case nir_op_ige32:
                dst[0] = ir3_CMPS_S(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_GE;
                break;
+       case nir_op_ieq16:
        case nir_op_ieq32:
                dst[0] = ir3_CMPS_S(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_EQ;
                break;
+       case nir_op_ine16:
        case nir_op_ine32:
                dst[0] = ir3_CMPS_S(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_NE;
                break;
+       case nir_op_ult16:
        case nir_op_ult32:
                dst[0] = ir3_CMPS_U(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_LT;
                break;
+       case nir_op_uge16:
        case nir_op_uge32:
                dst[0] = ir3_CMPS_U(b, src[0], 0, src[1], 0);
                dst[0]->cat2.condition = IR3_COND_GE;
@@ -665,9 +675,19 @@ emit_alu(struct ir3_context *ctx, nir_alu_instr *alu)
 
        if (nir_alu_type_get_base_type(info->output_type) == nir_type_bool) {
                assert(dst_sz == 1);
+
+               if (nir_dest_bit_size(alu->dest.dest) < 32)
+                       dst[0]->regs[0]->flags |= IR3_REG_HALF;
+
                dst[0] = ir3_n2b(b, dst[0]);
        }
 
+       if (nir_dest_bit_size(alu->dest.dest) < 32) {
+               for (unsigned i = 0; i < dst_sz; i++) {
+                       dst[i]->regs[0]->flags |= IR3_REG_HALF;
+               }
+       }
+
        ir3_put_dst(ctx, &alu->dest.dest);
 }