nir/algebraic: add new fsum ops and fdot lowering

author Erico Nunes <nunes.erico@gmail.com>

Sat, 27 Jul 2019 15:58:53 +0000 (17:58 +0200)

committer Erico Nunes <nunes.erico@gmail.com>

Wed, 31 Jul 2019 19:35:58 +0000 (21:35 +0200)
author Erico Nunes <nunes.erico@gmail.com>
Sat, 27 Jul 2019 15:58:53 +0000 (17:58 +0200)
committer Erico Nunes <nunes.erico@gmail.com>
Wed, 31 Jul 2019 19:35:58 +0000 (21:35 +0200)
diff --git a/src/compiler/nir/nir.h b/src/compiler/nir/nir.h

index a3c44ff988e219200e35694fdbdb81fb73dfe756..088b8d7d5e81b3a3ab49988b928ef7c430ca8a78 100644 (file)
--- a/src/compiler/nir/nir.h
+++ b/src/compiler/nir/nir.h
@@ -2556,6 +2556,9 @@ typedef struct nir_shader_compiler_options {
     /* lower fdph to fdot4 */
     bool lower_fdph;
  
+   /** lower fdot to fmul and fsum/fadd. */
+   bool lower_fdot;
+
     /* Does the native fdot instruction replicate its result for four
      * components?  If so, then opt_algebraic_late will turn all fdotN
      * instructions into fdot_replicatedN instructions.
diff --git a/src/compiler/nir/nir_opcodes.py b/src/compiler/nir/nir_opcodes.py

index 7854faec15f4fc579236bb0779a4e03da5a171e5..3020da98264e8253bb3855579f9374b7c682c21e 100644 (file)
--- a/src/compiler/nir/nir_opcodes.py
+++ b/src/compiler/nir/nir_opcodes.py
@@ -439,6 +439,8 @@ if (src0.z >= 0 && absZ >= absX && absZ >= absY) dst.x = 4;
  if (src0.z < 0 && absZ >= absX && absZ >= absY) dst.x = 5;
  """)
  
+# Sum of vector components
+unop_reduce("fsum", 1, tfloat, tfloat, "{src}", "{src0} + {src1}", "{src}")
  
  def binop_convert(name, out_type, in_type, alg_props, const_expr):
     opcode(name, 0, out_type, [0, 0], [in_type, in_type],
diff --git a/src/compiler/nir/nir_opt_algebraic.py b/src/compiler/nir/nir_opt_algebraic.py

index 351f467b24682653afecac9d511f181f8683b8e5..9fc3be8f8b0930d6afa5772b04255432fd9f6e21 100644 (file)
--- a/src/compiler/nir/nir_opt_algebraic.py
+++ b/src/compiler/nir/nir_opt_algebraic.py
@@ -194,6 +194,12 @@ optimizations = [
     (('fdot2', ('vec2', a, 0.0), b), ('fmul', a, b)),
     (('fdot2', a, 1.0), ('fadd', 'a.x', 'a.y')),
  
+   # Lower fdot to fmul + fsum when options->lower_fdot is set; fsum2 becomes fadd
+   (('fdot2', a, b), ('fsum2', ('fmul', a, b)), 'options->lower_fdot'),
+   (('fdot3', a, b), ('fsum3', ('fmul', a, b)), 'options->lower_fdot'),
+   (('fdot4', a, b), ('fsum4', ('fmul', a, b)), 'options->lower_fdot'),
+   (('fsum2', a), ('fadd', 'a.x', 'a.y'), 'options->lower_fdot'),
+
     # If x >= 0 and x <= 1: fsat(1 - x) == 1 - fsat(x) trivially
     # If x < 0: 1 - fsat(x) => 1 - 0 => 1 and fsat(1 - x) => fsat(> 1) => 1
     # If x > 1: 1 - fsat(x) => 1 - 1 => 0 and fsat(1 - x) => fsat(< 0) => 0
author	Erico Nunes <nunes.erico@gmail.com>
	Sat, 27 Jul 2019 15:58:53 +0000 (17:58 +0200)
committer	Erico Nunes <nunes.erico@gmail.com>
	Wed, 31 Jul 2019 19:35:58 +0000 (21:35 +0200)
src/compiler/nir/nir.h		patch | blob | history
src/compiler/nir/nir_opcodes.py		patch | blob | history
src/compiler/nir/nir_opt_algebraic.py		patch | blob | history