nv50/ir: optimize near power-of-twos into shladd

author Rhys Perry <pendingchaos02@gmail.com>

Sat, 18 Aug 2018 14:06:01 +0000 (15:06 +0100)

committer Rhys Perry <pendingchaos02@gmail.com>

Mon, 27 Aug 2018 12:57:01 +0000 (13:57 +0100)
author Rhys Perry <pendingchaos02@gmail.com>
Sat, 18 Aug 2018 14:06:01 +0000 (15:06 +0100)
committer Rhys Perry <pendingchaos02@gmail.com>
Mon, 27 Aug 2018 12:57:01 +0000 (13:57 +0100)
diff --git a/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp b/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp

index 30de9f5c82da34d3eaa173f4bc2e110a26cf266d..1ab743705a7ce6b15b58c5fed8197f35cbd2aed3 100644 (file)
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp
@@ -958,6 +958,9 @@ ConstantFolding::opnd3(Instruction *i, ImmediateValue &imm2)
  bool
  ConstantFolding::createMul(DataType ty, Value *def, Value *a, int64_t b, Value *c)
  {
+   const Target *target = prog->getTarget();
+   int64_t absB = llabs(b);
+
     //a * (2^shl) -> a << shl
     if (b >= 0 && util_is_power_of_two_or_zero64(b)) {
        int shl = util_logbase2_64(b);
@@ -970,6 +973,30 @@ ConstantFolding::createMul(DataType ty, Value *def, Value *a, int64_t b, Value *
        return true;
     }
  
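+   //a * (2^shl + 1) -> (a << shl) + a
+   //a * -(2^shl + 1) -> (-a << shl) - a
+   //a * (2^shl - 1) -> (a << shl) - a
+   //a * -(2^shl - 1) -> (-a << shl) + a
+   //NOTE(review): for b < 0 the code below still negates src(2) only when
+   //subA is set, i.e. it emits (-a << shl) + a for -(2^shl + 1) and
+   //(-a << shl) - a for -(2^shl - 1); by the identities above those two
+   //cases look swapped (e.g. b = -5 would yield -3 * a) - please confirm.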
+   if (typeSizeof(ty) == 4 &&
+       (util_is_power_of_two_or_zero64(absB - 1) ||
+        util_is_power_of_two_or_zero64(absB + 1)) &&
+       target->isOpSupported(OP_SHLADD, TYPE_U32)) {
+      bool subA = util_is_power_of_two_or_zero64(absB + 1);
+      int shl = subA ? util_logbase2_64(absB + 1) : util_logbase2_64(absB - 1);
+
+      Value *res = c ? bld.getSSA() : def;
+      Instruction *insn = bld.mkOp3(OP_SHLADD, TYPE_U32, res, a, bld.mkImm(shl), a);
+      if (b < 0)
+         insn->src(0).mod = Modifier(NV50_IR_MOD_NEG);
+      if (subA)
+         insn->src(2).mod = Modifier(NV50_IR_MOD_NEG);
+
+      if (c)
+         bld.mkOp2(OP_ADD, TYPE_U32, def, res, c);
+
+      return true;
+   }
+
     return false;
  }
author	Rhys Perry <pendingchaos02@gmail.com>
	Sat, 18 Aug 2018 14:06:01 +0000 (15:06 +0100)
committer	Rhys Perry <pendingchaos02@gmail.com>
	Mon, 27 Aug 2018 12:57:01 +0000 (13:57 +0100)