i965/vec4: fix swizzle and writemask when loading an uniform with constant offset

author Samuel Iglesias Gonsálvez <siglesias@igalia.com>

Wed, 19 Apr 2017 08:35:07 +0000 (10:35 +0200)

committer Samuel Iglesias Gonsálvez <siglesias@igalia.com>

Thu, 18 May 2017 04:49:54 +0000 (06:49 +0200)
author Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Wed, 19 Apr 2017 08:35:07 +0000 (10:35 +0200)
committer Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Thu, 18 May 2017 04:49:54 +0000 (06:49 +0200)
diff --git a/src/intel/compiler/brw_vec4_nir.cpp b/src/intel/compiler/brw_vec4_nir.cpp

index 66324e3bcd7ff0a5877b719019c58ee701e71e9e..0e8807c5b42b57c6e0ab72411393a0751bb98e70 100644 (file)
--- a/src/intel/compiler/brw_vec4_nir.cpp
+++ b/src/intel/compiler/brw_vec4_nir.cpp
@@ -769,7 +769,8 @@ vec4_visitor::nir_emit_intrinsic(nir_intrinsic_instr *instr)
         * The swizzle also works in the indirect case as the generator adds
         * the swizzle to the offset for us.
         */
-      unsigned shift = (nir_intrinsic_base(instr) % 16) / 4;
+      const int type_size = type_sz(src.type);
+      unsigned shift = (nir_intrinsic_base(instr) % 16) / type_size;
        assert(shift + instr->num_components <= 4);
  
        nir_const_value *const_offset = nir_src_as_const_value(instr->src[0]);
@@ -777,14 +778,20 @@ vec4_visitor::nir_emit_intrinsic(nir_intrinsic_instr *instr)
           /* Offsets are in bytes but they should always be multiples of 4 */
           assert(const_offset->u32[0] % 4 == 0);
  
-         unsigned offset = const_offset->u32[0] + shift * 4;
+         src.swizzle = brw_swizzle_for_size(instr->num_components);
+         dest.writemask = brw_writemask_for_size(instr->num_components);
+         unsigned offset = const_offset->u32[0] + shift * type_size;
           src.offset = ROUND_DOWN_TO(offset, 16);
-         shift = (offset % 16) / 4;
+         shift = (offset % 16) / type_size;
+         assert(shift + instr->num_components <= 4);
           src.swizzle += BRW_SWIZZLE4(shift, shift, shift, shift);
  
           emit(MOV(dest, src));
        } else {
-         src.swizzle += BRW_SWIZZLE4(shift, shift, shift, shift);
+         /* Uniform arrays are vec4 aligned, because of std140 alignment
+          * rules.
+          */
+         assert(shift == 0);
  
           src_reg indirect = get_nir_src(instr->src[0], BRW_REGISTER_TYPE_UD, 1);
author	Samuel Iglesias Gonsálvez <siglesias@igalia.com>
	Wed, 19 Apr 2017 08:35:07 +0000 (10:35 +0200)
committer	Samuel Iglesias Gonsálvez <siglesias@igalia.com>
	Thu, 18 May 2017 04:49:54 +0000 (06:49 +0200)