middle-end: __builtin_mul_overflow expansion improvements [PR95862]

author Jakub Jelinek <jakub@redhat.com>

Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)

committer Jakub Jelinek <jakub@redhat.com>

Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)
author Jakub Jelinek <jakub@redhat.com>
Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)
committer Jakub Jelinek <jakub@redhat.com>
Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)
diff --git a/gcc/internal-fn.c b/gcc/internal-fn.c

index 792d2ca568a4a11c3e3ad8abf6443f173b0650a7..7dad8da4031cdae0523b2e88458386fe4eb10f21 100644 (file)
--- a/gcc/internal-fn.c
+++ b/gcc/internal-fn.c
@@ -553,6 +553,16 @@ get_min_precision (tree arg, signop sign)
        if (++cnt > 30)
         return prec + (orig_sign != sign);
      }
+  if (CONVERT_EXPR_P (arg)
+      && INTEGRAL_TYPE_P (TREE_TYPE (TREE_OPERAND (arg, 0)))
+      && TYPE_PRECISION (TREE_TYPE (TREE_OPERAND (arg, 0))) > prec)
+    {
+      /* We have e.g. (unsigned short) y_2 where int y_2 = (int) x_1(D);
+        If y_2's min precision is smaller than prec, return that.  */
+      int oprec = get_min_precision (TREE_OPERAND (arg, 0), sign);
+      if (oprec < prec)
+       return oprec + (orig_sign != sign);
+    }
    if (TREE_CODE (arg) != SSA_NAME)
      return prec + (orig_sign != sign);
    wide_int arg_min, arg_max;
@@ -1357,6 +1367,37 @@ expand_mul_overflow (location_t loc, tree lhs, tree arg0, tree arg1,
                                    NULL, done_label, profile_probability::very_likely ());
           goto do_error_label;
         case 3:
+         if (get_min_precision (arg1, UNSIGNED)
+             + get_min_precision (arg0, SIGNED) <= GET_MODE_PRECISION (mode))
+           {
+             /* If the first operand is sign extended from narrower type, the
+                second operand is zero extended from narrower type and
+                the sum of the two precisions is smaller or equal to the
+                result precision: if the first argument is at runtime
+                non-negative, maximum result will be 0x7e81 or 0x7f..fe80..01
+                and there will be no overflow, if the first argument is
+                negative and the second argument zero, the result will be
+                0 and there will be no overflow, if the first argument is
+                negative and the second argument positive, the result when
+                treated as signed will be negative (minimum -0x7f80 or
+                -0x7f..f80..0) and there will always be overflow.  So, do
+                res = (U) (s1 * u2)
+                ovf = (S) res < 0  */
+             struct separate_ops ops;
+             ops.code = MULT_EXPR;
+             ops.type
+               = build_nonstandard_integer_type (GET_MODE_PRECISION (mode),
+                                                 1);
+             ops.op0 = make_tree (ops.type, op0);
+             ops.op1 = make_tree (ops.type, op1);
+             ops.op2 = NULL_TREE;
+             ops.location = loc;
+             res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
+             do_compare_rtx_and_jump (res, const0_rtx, GE, false,
+                                      mode, NULL_RTX, NULL, done_label,
+                                      profile_probability::very_likely ());
+             goto do_error_label;
+           }
           rtx_code_label *do_main_label;
           do_main_label = gen_label_rtx ();
           do_compare_rtx_and_jump (op0, const0_rtx, GE, false, mode, NULL_RTX,
@@ -1374,7 +1415,16 @@ expand_mul_overflow (location_t loc, tree lhs, tree arg0, tree arg1,
    /* u1 * u2 -> sr  */
    if (uns0_p && uns1_p && !unsr_p)
      {
-      uns = true;
+      if ((pos_neg0 | pos_neg1) == 1)
+       {
+         /* If both arguments are zero extended from narrower types,
+            the MSB will be clear on both and so we can pretend it is
+            a normal s1 * s2 -> sr multiplication.  */
+         uns0_p = false;
+         uns1_p = false;
+       }
+      else
+       uns = true;
        /* Rest of handling of this case after res is computed.  */
        goto do_main;
      }
@@ -1455,6 +1505,37 @@ expand_mul_overflow (location_t loc, tree lhs, tree arg0, tree arg1,
                                        profile_probability::very_likely ());
               goto do_error_label;
             }
+         if (get_min_precision (arg0, SIGNED)
+             + get_min_precision (arg1, SIGNED) <= GET_MODE_PRECISION (mode))
+           {
+             /* If both operands are sign extended from narrower types and
+                the sum of the two precisions is smaller or equal to the
+                result precision: if both arguments are at runtime
+                non-negative, maximum result will be 0x3f01 or 0x3f..f0..01
+                and there will be no overflow, if both arguments are negative,
+                maximum result will be 0x40..00 and there will be no overflow
+                either, if one argument is positive and the other argument
+                negative, the result when treated as signed will be negative
+                and there will always be overflow, and if one argument is
+                zero and the other negative the result will be zero and no
+                overflow.  So, do
+                res = (U) (s1 * s2)
+                ovf = (S) res < 0  */
+             struct separate_ops ops;
+             ops.code = MULT_EXPR;
+             ops.type
+               = build_nonstandard_integer_type (GET_MODE_PRECISION (mode),
+                                                 1);
+             ops.op0 = make_tree (ops.type, op0);
+             ops.op1 = make_tree (ops.type, op1);
+             ops.op2 = NULL_TREE;
+             ops.location = loc;
+             res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
+             do_compare_rtx_and_jump (res, const0_rtx, GE, false,
+                                      mode, NULL_RTX, NULL, done_label,
+                                      profile_probability::very_likely ());
+             goto do_error_label;
+           }
           /* The general case, do all the needed comparisons at runtime.  */
           rtx_code_label *do_main_label, *after_negate_label;
           rtx rop0, rop1;
diff --git a/gcc/testsuite/gcc.dg/builtin-artih-overflow-5.c b/gcc/testsuite/gcc.dg/builtin-artih-overflow-5.c

new file mode 100644 (file)

index 0000000..b43fd18
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/builtin-artih-overflow-5.c
@@ -0,0 +1,87 @@
+/* PR rtl-optimization/95862 */
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+int
+f1 (int a, int b) /* signed * signed -> unsigned result  */
+{
+  unsigned long long c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+int
+f2 (int a, unsigned b) /* signed * unsigned -> unsigned result  */
+{
+  unsigned long long c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+int
+f3 (unsigned a, unsigned b) /* unsigned * unsigned -> signed result  */
+{
+  long long c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+int
+f4 (int a, unsigned b) /* signed * unsigned -> signed result  */
+{
+  long long c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+short
+f5 (short a, short b) /* signed * signed -> unsigned result  */
+{
+  unsigned c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+short
+f6 (short a, unsigned short b) /* signed * unsigned -> unsigned result  */
+{
+  unsigned c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+short
+f7 (unsigned short a, unsigned short b) /* unsigned * unsigned -> signed  */
+{
+  int c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+short
+f8 (short a, unsigned short b) /* signed * unsigned -> signed result  */
+{
+  int c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+signed char
+f9 (signed char a, signed char b) /* signed * signed -> unsigned result  */
+{
+  unsigned short c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+signed char
+f10 (signed char a, unsigned char b) /* signed * unsigned -> unsigned  */
+{
+  unsigned short c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+signed char
+f11 (unsigned char a, unsigned char b) /* unsigned * unsigned -> signed  */
+{
+  short c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
+
+signed char
+f12 (signed char a, unsigned char b) /* signed * unsigned -> signed  */
+{
+  short c;
+  return __builtin_mul_overflow (a, b, &c); /* nonzero on overflow  */
+}
author	Jakub Jelinek <jakub@redhat.com>
	Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)
committer	Jakub Jelinek <jakub@redhat.com>
	Wed, 25 Nov 2020 14:42:38 +0000 (15:42 +0100)
gcc/internal-fn.c		patch \| blob \| history
gcc/testsuite/gcc.dg/builtin-artih-overflow-5.c	[new file with mode: 0644]	patch \| blob