nir: mind rounding mode on fadd, fsub, fmul and fma opcodes

author Samuel Iglesias Gonsálvez <siglesias@igalia.com>

Tue, 12 Feb 2019 14:43:10 +0000 (15:43 +0100)

committer Andres Gomez <agomez@igalia.com>

Tue, 17 Sep 2019 20:39:18 +0000 (23:39 +0300)
author Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Tue, 12 Feb 2019 14:43:10 +0000 (15:43 +0100)
committer Andres Gomez <agomez@igalia.com>
Tue, 17 Sep 2019 20:39:18 +0000 (23:39 +0300)
diff --git a/src/compiler/nir/nir_constant_expressions.py b/src/compiler/nir/nir_constant_expressions.py

index 219d91c1cbd74cd40392a28a71b9fed486f1323a..baba66e5d024fb4762f8c8be7b89c0d776ee1a84 100644 (file)
--- a/src/compiler/nir/nir_constant_expressions.py
+++ b/src/compiler/nir/nir_constant_expressions.py
@@ -64,6 +64,7 @@ template = """\
  #include "util/rounding.h" /* for _mesa_roundeven */
  #include "util/half_float.h"
  #include "util/double.h"
+#include "util/softfloat.h"
  #include "util/bigmath.h"
  #include "nir_constant_expressions.h"
  
diff --git a/src/compiler/nir/nir_opcodes.py b/src/compiler/nir/nir_opcodes.py

index 13f64d78c4ff053a9246c7e302875278f2767d8e..5a1c8fd25148532f8af4af90c319b7dce1a5c318 100644 (file)
--- a/src/compiler/nir/nir_opcodes.py
+++ b/src/compiler/nir/nir_opcodes.py
@@ -492,7 +492,16 @@ def binop_reduce(name, output_size, output_type, src_type, prereduce_expr,
            [4, 4], [src_type, src_type], False, _2src_commutative,
            final(reduce_(reduce_(src0, src1), reduce_(src2, src3))))
  
-binop("fadd", tfloat, _2src_commutative + associative, "src0 + src1")
+binop("fadd", tfloat, _2src_commutative + associative,"""
+if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
+   if (bit_size == 64)
+      dst = _mesa_double_add_rtz(src0, src1);
+   else
+      dst = _mesa_double_to_float_rtz((double)src0 + (double)src1);
+} else {
+   dst = src0 + src1;
+}
+""")
  binop("iadd", tint, _2src_commutative + associative, "src0 + src1")
  binop("iadd_sat", tint, _2src_commutative, """
        src1 > 0 ?
@@ -508,10 +517,28 @@ binop("isub_sat", tint, "", """
  """)
  binop("usub_sat", tuint, "", "src0 < src1 ? 0 : src0 - src1")
  
-binop("fsub", tfloat, "", "src0 - src1")
+binop("fsub", tfloat, "", """
+if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
+   if (bit_size == 64)
+      dst = _mesa_double_sub_rtz(src0, src1);
+   else
+      dst = _mesa_double_to_float_rtz((double)src0 - (double)src1);
+} else {
+   dst = src0 - src1;
+}
+""")
  binop("isub", tint, "", "src0 - src1")
  
-binop("fmul", tfloat, _2src_commutative + associative, "src0 * src1")
+binop("fmul", tfloat, _2src_commutative + associative, """
+if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
+   if (bit_size == 64)
+      dst = _mesa_double_mul_rtz(src0, src1);
+   else
+      dst = _mesa_double_to_float_rtz((double)src0 * (double)src1);
+} else {
+   dst = src0 * src1;
+}
+""")
  # low 32-bits of signed/unsigned integer multiply
  binop("imul", tint, _2src_commutative + associative, "src0 * src1")
  
@@ -834,7 +861,21 @@ def triop_horiz(name, output_size, src1_size, src2_size, src3_size, const_expr):
     [src1_size, src2_size, src3_size],
     [tuint, tuint, tuint], False, "", const_expr)
  
-triop("ffma", tfloat, _2src_commutative, "src0 * src1 + src2")
+triop("ffma", tfloat, _2src_commutative, """
+if (nir_is_rounding_mode_rtz(execution_mode, bit_size)) {
+   if (bit_size == 64)
+      dst = _mesa_double_fma_rtz(src0, src1, src2);
+   else if (bit_size == 32)
+      dst = _mesa_float_fma_rtz(src0, src1, src2);
+   else
+      dst = _mesa_double_to_float_rtz(_mesa_double_fma_rtz(src0, src1, src2));
+} else {
+   if (bit_size == 32)
+      dst = fmaf(src0, src1, src2);
+   else
+      dst = fma(src0, src1, src2);
+}
+""")
  
  triop("flrp", tfloat, "", "src0 * (1 - src2) + src1 * src2")
author	Samuel Iglesias Gonsálvez <siglesias@igalia.com>
	Tue, 12 Feb 2019 14:43:10 +0000 (15:43 +0100)
committer	Andres Gomez <agomez@igalia.com>
	Tue, 17 Sep 2019 20:39:18 +0000 (23:39 +0300)
src/compiler/nir/nir_constant_expressions.py		patch | blob | history
src/compiler/nir/nir_opcodes.py		patch | blob | history