nir: Add a fdot instruction that replicates the result to a vec4

author Jason Ekstrand <jason.ekstrand@intel.com>

Thu, 10 Sep 2015 17:51:46 +0000 (10:51 -0700)

committer Jason Ekstrand <jason.ekstrand@intel.com>

Tue, 15 Sep 2015 19:38:48 +0000 (12:38 -0700)
author Jason Ekstrand <jason.ekstrand@intel.com>
Thu, 10 Sep 2015 17:51:46 +0000 (10:51 -0700)
committer Jason Ekstrand <jason.ekstrand@intel.com>
Tue, 15 Sep 2015 19:38:48 +0000 (12:38 -0700)
diff --git a/src/glsl/nir/nir.h b/src/glsl/nir/nir.h

index 3f693b17fb147ba3bf67b002e50f05277a90f0a6..4e4543ad5ec992e88cf7224af8d00b8f31366645 100644 (file)
--- a/src/glsl/nir/nir.h
+++ b/src/glsl/nir/nir.h
@@ -1434,6 +1434,12 @@ typedef struct nir_shader_compiler_options {
     /* lower {slt,sge,seq,sne} to {flt,fge,feq,fne} + b2f: */
     bool lower_scmp;
  
+   /* Does the native fdot instruction replicate its result for four
+    * components?  If so, then opt_algebraic_late will turn all fdotN
+    * instructions into fdot_replicatedN instructions.
+    */
+   bool fdot_replicates;
+
     /**
      * Does the driver support real 32-bit integers?  (Otherwise, integers
      * are simulated by floats.)
diff --git a/src/glsl/nir/nir_opcodes.py b/src/glsl/nir/nir_opcodes.py

index df5b7e2d517c2057328147c2a9ff462dd13e5013..495d109375b995089ec05452f00defd5284febe3 100644 (file)
--- a/src/glsl/nir/nir_opcodes.py
+++ b/src/glsl/nir/nir_opcodes.py
@@ -453,6 +453,9 @@ binop("fxor", tfloat, commutative,
  binop_reduce("fdot", 1, tfloat, tfloat, "{src0} * {src1}", "{src0} + {src1}",
               "{src}")
  
+binop_reduce("fdot_replicated", 4, tfloat, tfloat,
+             "{src0} * {src1}", "{src0} + {src1}", "{src}")
+
  binop("fmin", tfloat, "", "fminf(src0, src1)")
  binop("imin", tint, commutative + associative, "src1 > src0 ? src0 : src1")
  binop("umin", tunsigned, commutative + associative, "src1 > src0 ? src0 : src1")
diff --git a/src/glsl/nir/nir_opt_algebraic.py b/src/glsl/nir/nir_opt_algebraic.py

index 226e0a8d85c3696584a9406608af49b4f58619eb..acc3b04b118089e366f83c7f6eb331da149b0c46 100644 (file)
--- a/src/glsl/nir/nir_opt_algebraic.py
+++ b/src/glsl/nir/nir_opt_algebraic.py
@@ -240,6 +240,9 @@ late_optimizations = [
     (('fge', ('fadd', a, b), 0.0), ('fge', a, ('fneg', b))),
     (('feq', ('fadd', a, b), 0.0), ('feq', a, ('fneg', b))),
     (('fne', ('fadd', a, b), 0.0), ('fne', a, ('fneg', b))),
+   (('fdot2', a, b), ('fdot_replicated2', a, b), 'options->fdot_replicates'),
+   (('fdot3', a, b), ('fdot_replicated3', a, b), 'options->fdot_replicates'),
+   (('fdot4', a, b), ('fdot_replicated4', a, b), 'options->fdot_replicates'),
  ]
  
  print nir_algebraic.AlgebraicPass("nir_opt_algebraic", optimizations).render()
author	Jason Ekstrand <jason.ekstrand@intel.com>
	Thu, 10 Sep 2015 17:51:46 +0000 (10:51 -0700)
committer	Jason Ekstrand <jason.ekstrand@intel.com>
	Tue, 15 Sep 2015 19:38:48 +0000 (12:38 -0700)
src/glsl/nir/nir.h		patch | blob | history
src/glsl/nir/nir_opcodes.py		patch | blob | history
src/glsl/nir/nir_opt_algebraic.py		patch | blob | history