i965/vec4: use vec4_builder to emit instructions in setup_imm_df()

author Samuel Iglesias Gonsálvez <siglesias@igalia.com>

Tue, 7 Mar 2017 09:29:53 +0000 (10:29 +0100)

committer Francisco Jerez <currojerez@riseup.net>

Fri, 14 Apr 2017 21:56:09 +0000 (14:56 -0700)
author Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Tue, 7 Mar 2017 09:29:53 +0000 (10:29 +0100)
committer Francisco Jerez <currojerez@riseup.net>
Fri, 14 Apr 2017 21:56:09 +0000 (14:56 -0700)
diff --git a/src/intel/compiler/brw_vec4.h b/src/intel/compiler/brw_vec4.h

index d12405c22e1c7bc7a2fce5815a9db526cb737d88..89adfaa7b79f8f0b44e13367b680356bd4aa2223 100644 (file)
--- a/src/intel/compiler/brw_vec4.h
+++ b/src/intel/compiler/brw_vec4.h
@@ -28,6 +28,7 @@
  
  #ifdef __cplusplus
  #include "brw_ir_vec4.h"
+#include "brw_vec4_builder.h"
  #endif
  
  #include "compiler/glsl/ir.h"
@@ -324,8 +325,6 @@ public:
     void emit_conversion_from_double(dst_reg dst, src_reg src, bool saturate);
     void emit_conversion_to_double(dst_reg dst, src_reg src, bool saturate);
  
-   src_reg setup_imm_df(double v);
-
     vec4_instruction *shuffle_64bit_data(dst_reg dst, src_reg src,
                                          bool for_write,
                                          bblock_t *block = NULL,
diff --git a/src/intel/compiler/brw_vec4_nir.cpp b/src/intel/compiler/brw_vec4_nir.cpp

index 9d9ded2b9657c29b8d76fe841f1fc6f1a37b0b1f..a82d52088a8770f2ebae9473ccc2822a8d96cc7e 100644 (file)
--- a/src/intel/compiler/brw_vec4_nir.cpp
+++ b/src/intel/compiler/brw_vec4_nir.cpp
@@ -353,6 +353,53 @@ vec4_visitor::get_indirect_offset(nir_intrinsic_instr *instr)
     return get_nir_src(*offset_src, BRW_REGISTER_TYPE_UD, 1);
  }
  
+static src_reg
+setup_imm_df(const vec4_builder &bld, double v)
+{
+   const gen_device_info *devinfo = bld.shader->devinfo;
+   assert(devinfo->gen >= 7);
+
+   if (devinfo->gen >= 8)
+      return brw_imm_df(v);
+
+   /* gen7.5 does not support DF immediates straighforward but the DIM
+    * instruction allows to set the 64-bit immediate value.
+    */
+   if (devinfo->is_haswell) {
+      const vec4_builder ubld = bld.exec_all();
+      const dst_reg dst = bld.vgrf(BRW_REGISTER_TYPE_DF);
+      ubld.DIM(dst, brw_imm_df(v));
+      return swizzle(src_reg(dst), BRW_SWIZZLE_XXXX);
+   }
+
+   /* gen7 does not support DF immediates */
+   union {
+      double d;
+      struct {
+         uint32_t i1;
+         uint32_t i2;
+      };
+   } di;
+
+   di.d = v;
+
+   /* Write the low 32-bit of the constant to the X:UD channel and the
+    * high 32-bit to the Y:UD channel to build the constant in a VGRF.
+    * We have to do this twice (offset 0 and offset 1), since a DF VGRF takes
+    * two SIMD8 registers in SIMD4x2 execution. Finally, return a swizzle
+    * XXXX so any access to the VGRF only reads the constant data in these
+    * channels.
+    */
+   const dst_reg tmp = bld.vgrf(BRW_REGISTER_TYPE_UD, 2);
+   for (unsigned n = 0; n < 2; n++) {
+      const vec4_builder ubld = bld.exec_all().group(4, n);
+      ubld.MOV(writemask(offset(tmp, 8, n), WRITEMASK_X), brw_imm_ud(di.i1));
+      ubld.MOV(writemask(offset(tmp, 8, n), WRITEMASK_Y), brw_imm_ud(di.i2));
+   }
+
+   return swizzle(src_reg(retype(tmp, BRW_REGISTER_TYPE_DF)), BRW_SWIZZLE_XXXX);
+}
+
  void
  vec4_visitor::nir_emit_load_const(nir_load_const_instr *instr)
  {
@@ -366,6 +413,7 @@ vec4_visitor::nir_emit_load_const(nir_load_const_instr *instr)
        reg.type = BRW_REGISTER_TYPE_D;
     }
  
+   const vec4_builder ibld = vec4_builder(this).at_end();
     unsigned remaining = brw_writemask_for_size(instr->def.num_components);
  
     /* @FIXME: consider emitting vector operations to save some MOVs in
@@ -389,7 +437,7 @@ vec4_visitor::nir_emit_load_const(nir_load_const_instr *instr)
  
        reg.writemask = writemask;
        if (instr->def.bit_size == 64) {
-         emit(MOV(reg, setup_imm_df(instr->value.f64[i])));
+         emit(MOV(reg, setup_imm_df(ibld, instr->value.f64[i])));
        } else {
           emit(MOV(reg, brw_imm_d(instr->value.i32[i])));
        }
@@ -1220,53 +1268,6 @@ vec4_visitor::emit_conversion_to_double(dst_reg dst, src_reg src,
     inst->saturate = saturate;
  }
  
-src_reg
-vec4_visitor::setup_imm_df(double v)
-{
-   assert(devinfo->gen >= 7);
-
-   if (devinfo->gen >= 8)
-      return brw_imm_df(v);
-
-   /* gen7.5 does not support DF immediates straighforward but the DIM
-    * instruction allows to set the 64-bit immediate value.
-    */
-   if (devinfo->is_haswell) {
-      dst_reg dst = retype(dst_reg(VGRF, alloc.allocate(2)), BRW_REGISTER_TYPE_DF);
-      emit(DIM(dst, brw_imm_df(v)))->force_writemask_all = true;
-      return swizzle(src_reg(retype(dst, BRW_REGISTER_TYPE_DF)), BRW_SWIZZLE_XXXX);
-   }
-
-   /* gen7 does not support DF immediates */
-   union {
-      double d;
-      struct {
-         uint32_t i1;
-         uint32_t i2;
-      };
-   } di;
-
-   di.d = v;
-
-   /* Write the low 32-bit of the constant to the X:UD channel and the
-    * high 32-bit to the Y:UD channel to build the constant in a VGRF.
-    * We have to do this twice (offset 0 and offset 1), since a DF VGRF takes
-    * two SIMD8 registers in SIMD4x2 execution. Finally, return a swizzle
-    * XXXX so any access to the VGRF only reads the constant data in these
-    * channels.
-    */
-   const dst_reg tmp =
-      retype(dst_reg(VGRF, alloc.allocate(2)), BRW_REGISTER_TYPE_UD);
-   for (int n = 0; n < 2; n++) {
-      emit(MOV(writemask(offset(tmp, 8, n), WRITEMASK_X), brw_imm_ud(di.i1)))
-         ->force_writemask_all = true;
-      emit(MOV(writemask(offset(tmp, 8, n), WRITEMASK_Y), brw_imm_ud(di.i2)))
-         ->force_writemask_all = true;
-   }
-
-   return swizzle(src_reg(retype(tmp, BRW_REGISTER_TYPE_DF)), BRW_SWIZZLE_XXXX);
-}
-
  void
  vec4_visitor::nir_emit_alu(nir_alu_instr *instr)
  {
author	Samuel Iglesias Gonsálvez <siglesias@igalia.com>
	Tue, 7 Mar 2017 09:29:53 +0000 (10:29 +0100)
committer	Francisco Jerez <currojerez@riseup.net>
	Fri, 14 Apr 2017 21:56:09 +0000 (14:56 -0700)
src/intel/compiler/brw_vec4.h		patch \| blob \| history
src/intel/compiler/brw_vec4_nir.cpp		patch \| blob \| history