nir: Don't forget if-uses in new nir_opt_dead_cf liveness check

[mesa.git] / src / compiler / nir / nir_opcodes.py
diff --git a/src/compiler/nir/nir_opcodes.py b/src/compiler/nir/nir_opcodes.py

index ac2bb9cf7116c7b5d2d63d34f70581dd3a81c619..d32005846a625f6c333d2c1974a3c40528909f17 100644 (file)
--- a/src/compiler/nir/nir_opcodes.py
+++ b/src/compiler/nir/nir_opcodes.py
@@ -91,6 +91,7 @@ class Opcode(object):
  tfloat = "float"
  tint = "int"
  tbool = "bool"
+tbool1 = "bool1"
  tbool32 = "bool32"
  tuint = "uint"
  tuint16 = "uint16"
@@ -119,11 +120,11 @@ def type_sizes(type_):
      if type_has_size(type_):
          return [type_size(type_)]
      elif type_ == 'bool':
-        return [32]
+        return [1, 32]
      elif type_ == 'float':
          return [16, 32, 64]
      else:
-        return [8, 16, 32, 64]
+        return [1, 8, 16, 32, 64]
  
  def type_base_type(type_):
      m = _TYPE_SPLIT_RE.match(type_)
@@ -431,6 +432,9 @@ def binop(name, ty, alg_props, const_expr):
     binop_convert(name, ty, ty, alg_props, const_expr)
  
  def binop_compare(name, ty, alg_props, const_expr):
+   binop_convert(name, tbool1, ty, alg_props, const_expr)
+
+def binop_compare32(name, ty, alg_props, const_expr):
     binop_convert(name, tbool32, ty, alg_props, const_expr)
  
  def binop_horiz(name, out_size, out_type, src1_size, src1_type, src2_size,
@@ -462,6 +466,8 @@ def binop_reduce(name, output_size, output_type, src_type, prereduce_expr,
  
  binop("fadd", tfloat, commutative + associative, "src0 + src1")
  binop("iadd", tint, commutative + associative, "src0 + src1")
+binop("uadd_sat", tuint, commutative,
+      "(src0 + src1) < src0 ? UINT64_MAX : (src0 + src1)")
  binop("fsub", tfloat, "", "src0 - src1")
  binop("isub", tint, "", "src0 - src1")
  
@@ -558,16 +564,35 @@ binop_compare("ieq", tint, commutative, "src0 == src1")
  binop_compare("ine", tint, commutative, "src0 != src1")
  binop_compare("ult", tuint, "", "src0 < src1")
  binop_compare("uge", tuint, "", "src0 >= src1")
+binop_compare32("flt32", tfloat, "", "src0 < src1")
+binop_compare32("fge32", tfloat, "", "src0 >= src1")
+binop_compare32("feq32", tfloat, commutative, "src0 == src1")
+binop_compare32("fne32", tfloat, commutative, "src0 != src1")
+binop_compare32("ilt32", tint, "", "src0 < src1")
+binop_compare32("ige32", tint, "", "src0 >= src1")
+binop_compare32("ieq32", tint, commutative, "src0 == src1")
+binop_compare32("ine32", tint, commutative, "src0 != src1")
+binop_compare32("ult32", tuint, "", "src0 < src1")
+binop_compare32("uge32", tuint, "", "src0 >= src1")
  
  # integer-aware GLSL-style comparisons that compare floats and ints
  
-binop_reduce("ball_fequal",  1, tbool32, tfloat, "{src0} == {src1}",
+binop_reduce("ball_fequal",  1, tbool1, tfloat, "{src0} == {src1}",
+             "{src0} && {src1}", "{src}")
+binop_reduce("bany_fnequal", 1, tbool1, tfloat, "{src0} != {src1}",
+             "{src0} || {src1}", "{src}")
+binop_reduce("ball_iequal",  1, tbool1, tint, "{src0} == {src1}",
+             "{src0} && {src1}", "{src}")
+binop_reduce("bany_inequal", 1, tbool1, tint, "{src0} != {src1}",
+             "{src0} || {src1}", "{src}")
+
+binop_reduce("b32all_fequal",  1, tbool32, tfloat, "{src0} == {src1}",
               "{src0} && {src1}", "{src}")
-binop_reduce("bany_fnequal", 1, tbool32, tfloat, "{src0} != {src1}",
+binop_reduce("b32any_fnequal", 1, tbool32, tfloat, "{src0} != {src1}",
               "{src0} || {src1}", "{src}")
-binop_reduce("ball_iequal",  1, tbool32, tint, "{src0} == {src1}",
+binop_reduce("b32all_iequal",  1, tbool32, tint, "{src0} == {src1}",
               "{src0} && {src1}", "{src}")
-binop_reduce("bany_inequal", 1, tbool32, tint, "{src0} != {src1}",
+binop_reduce("b32any_inequal", 1, tbool32, tint, "{src0} != {src1}",
               "{src0} || {src1}", "{src}")
  
  # non-integer-aware GLSL-style comparisons that return 0.0 or 1.0
@@ -755,7 +780,9 @@ triop("imed3", tint, "MAX2(MIN2(MAX2(src0, src1), src2), MIN2(src0, src1))")
  triop("umed3", tuint, "MAX2(MIN2(MAX2(src0, src1), src2), MIN2(src0, src1))")
  
  opcode("bcsel", 0, tuint, [0, 0, 0],
-      [tbool32, tuint, tuint], "", "src0 ? src1 : src2")
+      [tbool1, tuint, tuint], "", "src0 ? src1 : src2")
+opcode("b32csel", 0, tuint, [0, 0, 0],
+       [tbool32, tuint, tuint], "", "src0 ? src1 : src2")
  
  # SM5 bfi assembly
  triop("bfi", tuint32, """