From a2ef38b1f94dd108046e702ad46dcd8e9b34625e Mon Sep 17 00:00:00 2001 From: Hans-Peter Nilsson Date: Tue, 16 Feb 2021 22:27:53 +0100 Subject: [PATCH] match.pd: Restrict clz cmp 0 replacement by single_use, PR99142 If we're not going to eliminate the clz, it's better for the comparison to use that result than its input, so we don't extend the lifetime of the input. Also, an additional use of the result is more likely cheaper than a compare of the input, in particular considering that the clz may have made available a non-zero condition matching the original use. The "s" modifier doesn't stop this situation, as the transformation wouldn't result in "an expression with more than one operator"; a gating single_use condition on the result is necessary. gcc: PR tree-optimization/99142 * match.pd (clz cmp 0): Gate replacement on single_use of clz result. gcc/testsuite: PR tree-optimization/99142 * gcc.dg/tree-ssa/pr99142.c: New test. --- gcc/match.pd | 4 ++-- gcc/testsuite/gcc.dg/tree-ssa/pr99142.c | 14 ++++++++++++++ 2 files changed, 16 insertions(+), 2 deletions(-) create mode 100644 gcc/testsuite/gcc.dg/tree-ssa/pr99142.c diff --git a/gcc/match.pd b/gcc/match.pd index e14f69744d7..760f773cf1b 100644 --- a/gcc/match.pd +++ b/gcc/match.pd @@ -6315,8 +6315,8 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) (for op (eq ne) cmp (lt ge) (simplify - (op (clz:s @0) INTEGER_CST@1) - (if (integer_zerop (@1)) + (op (clz:s@2 @0) INTEGER_CST@1) + (if (integer_zerop (@1) && single_use (@2)) /* clz(X) == 0 is (int)X < 0 and clz(X) != 0 is (int)X >= 0. */ (with { tree stype = signed_type_for (TREE_TYPE (@0)); HOST_WIDE_INT val = 0; diff --git a/gcc/testsuite/gcc.dg/tree-ssa/pr99142.c b/gcc/testsuite/gcc.dg/tree-ssa/pr99142.c new file mode 100644 index 00000000000..1781a89de32 --- /dev/null +++ b/gcc/testsuite/gcc.dg/tree-ssa/pr99142.c @@ -0,0 +1,14 @@ +/* { dg-do compile } */ +/* { dg-options "-O2 -fdump-tree-optimized" } */ +/* { dg-final { scan-tree-dump-not " >= 0\\)" "optimized" } } */ +int f(int a, int *b, int *d) +{ + int c = __builtin_clz(a); + + *b = c; + + if (c != 0) + *d = c; + + return c; +} -- 2.30.2