aco: remove copy in load_input_from_temps()

[mesa.git] / src / amd / compiler / aco_instruction_selection.cpp
diff --git a/src/amd/compiler/aco_instruction_selection.cpp b/src/amd/compiler/aco_instruction_selection.cpp

index 8552b06bf897ecaa048fcbdede68e87274a5102e..31a5e410e9f8042222107f567ea2f4d8a729ceda 100644 (file)
--- a/src/amd/compiler/aco_instruction_selection.cpp
+++ b/src/amd/compiler/aco_instruction_selection.cpp
@@ -561,16 +561,8 @@ void emit_vop2_instruction(isel_context *ctx, nir_alu_instr *instr, aco_opcode o
           Temp t = src0;
           src0 = src1;
           src1 = t;
-      } else if (src0.type() == RegType::vgpr &&
-                 op != aco_opcode::v_madmk_f32 &&
-                 op != aco_opcode::v_madak_f32 &&
-                 op != aco_opcode::v_madmk_f16 &&
-                 op != aco_opcode::v_madak_f16) {
-         /* If the instruction is not commutative, we emit a VOP3A instruction */
-         bld.vop2_e64(op, Definition(dst), src0, src1);
-         return;
        } else {
-         src1 = bld.copy(bld.def(RegType::vgpr, src1.size()), src1); //TODO: as_vgpr
+         src1 = as_vgpr(ctx, src1);
        }
     }
  
@@ -1639,7 +1631,7 @@ void visit_alu_instr(isel_context *ctx, nir_alu_instr *instr)
     }
     case nir_op_fsub: {
        Temp src0 = get_alu_src(ctx, instr->src[0]);
-      Temp src1 = as_vgpr(ctx, get_alu_src(ctx, instr->src[1]));
+      Temp src1 = get_alu_src(ctx, instr->src[1]);
        if (dst.regClass() == v2b) {
           Temp tmp = bld.tmp(v1);
           if (src1.type() == RegType::vgpr || src0.type() != RegType::vgpr)
@@ -1654,7 +1646,7 @@ void visit_alu_instr(isel_context *ctx, nir_alu_instr *instr)
              emit_vop2_instruction(ctx, instr, aco_opcode::v_subrev_f32, dst, true);
        } else if (dst.regClass() == v2) {
           Instruction* add = bld.vop3(aco_opcode::v_add_f64, Definition(dst),
-                                     src0, src1);
+                                     as_vgpr(ctx, src0), as_vgpr(ctx, src1));
           VOP3A_instruction* sub = static_cast<VOP3A_instruction*>(add);
           sub->neg[1] = true;
        } else {
@@ -3776,11 +3768,8 @@ bool load_input_from_temps(isel_context *ctx, nir_intrinsic_instr *instr, Temp d
  
     unsigned idx = nir_intrinsic_base(instr) + nir_intrinsic_component(instr) + 4 * nir_src_as_uint(*off_src);
     Temp *src = &ctx->inputs.temps[idx];
-   Temp vec = create_vec_from_array(ctx, src, dst.size(), dst.regClass().type(), 4u);
-   assert(vec.size() == dst.size());
+   create_vec_from_array(ctx, src, dst.size(), dst.regClass().type(), 4u, 0, dst);
  
-   Builder bld(ctx->program, ctx->block);
-   bld.copy(Definition(dst), vec);
     return true;
  }
  
@@ -9769,7 +9758,8 @@ static void create_vs_exports(isel_context *ctx)
     for (unsigned i = 0; i <= VARYING_SLOT_VAR31; ++i) {
        if (i < VARYING_SLOT_VAR0 &&
            i != VARYING_SLOT_LAYER &&
-          i != VARYING_SLOT_PRIMITIVE_ID)
+          i != VARYING_SLOT_PRIMITIVE_ID &&
+          i != VARYING_SLOT_VIEWPORT)
           continue;
  
        export_vs_varying(ctx, i, false, NULL);