i965/vec4: implement access to DF source components Z/W

author Iago Toral Quiroga <itoral@igalia.com>

Mon, 18 Jul 2016 11:43:00 +0000 (13:43 +0200)

committer Samuel Iglesias Gonsálvez <siglesias@igalia.com>

Tue, 3 Jan 2017 10:26:51 +0000 (11:26 +0100)
author Iago Toral Quiroga <itoral@igalia.com>
Mon, 18 Jul 2016 11:43:00 +0000 (13:43 +0200)
committer Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Tue, 3 Jan 2017 10:26:51 +0000 (11:26 +0100)
diff --git a/src/mesa/drivers/dri/i965/brw_vec4.cpp b/src/mesa/drivers/dri/i965/brw_vec4.cpp

index 6d73bb2faecf2556bf354b98d26eef873dab798b..cc0a76a7eb4fa1170cd1c456b12c85a9e642829b 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_vec4.cpp
+++ b/src/mesa/drivers/dri/i965/brw_vec4.cpp
@@ -2267,7 +2267,28 @@ vec4_visitor::apply_logical_swizzle(struct brw_reg *hw_reg,
      */
     assert(brw_is_single_value_swizzle(reg.swizzle));
  
+   /* To gain access to Z/W components we need to select the second half
+    * of the register and then use a X/Y swizzle to select Z/W respectively.
+    */
     unsigned swizzle = BRW_GET_SWZ(reg.swizzle, 0);
+
+   if (swizzle >= 2) {
+      *hw_reg = suboffset(*hw_reg, 2);
+      swizzle -= 2;
+   }
+
+   /* Any 64-bit source with an offset at 16B is intended to address the
+    * second half of a register and needs a vertical stride of 0 so we:
+    *
+    * 1. Don't violate register region restrictions.
+    * 2. Activate the gen7 instruction decompression bug exploit when
+    *    execsize > 4
+    */
+   if (hw_reg->subnr % REG_SIZE == 16) {
+      assert(devinfo->gen == 7);
+      hw_reg->vstride = BRW_VERTICAL_STRIDE_0;
+   }
+
     hw_reg->swizzle = BRW_SWIZZLE4(swizzle * 2, swizzle * 2 + 1,
                                    swizzle * 2, swizzle * 2 + 1);
  }
author	Iago Toral Quiroga <itoral@igalia.com>
	Mon, 18 Jul 2016 11:43:00 +0000 (13:43 +0200)
committer	Samuel Iglesias Gonsálvez <siglesias@igalia.com>
	Tue, 3 Jan 2017 10:26:51 +0000 (11:26 +0100)