Avoid minimum - 1 confusion in vectoriser

author Richard Sandiford <richard.sandiford@linaro.org>

Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)

committer Richard Sandiford <rsandifo@gcc.gnu.org>

Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)
author Richard Sandiford <richard.sandiford@linaro.org>
Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)
committer Richard Sandiford <rsandifo@gcc.gnu.org>
Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 8671c4d1b63805b2e2965edf4b188c9718348c26..ae68b7c3ee8fee04f683ddb62b8812e1be82a5a4 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,13 @@
+2017-07-03  Richard Sandiford  <richard.sandiford@linaro.org>
+
+       * tree-vect-loop.c (vect_analyze_loop_2): Treat min_scalar_loop_bound,
+       min_profitable_iters, and th as inclusive lower bounds.
+       Fix LOOP_VINFO_PEELING_FOR_GAPS condition.
+       (vect_estimate_min_profitable_iters): Return inclusive lower bounds
+       for min_profitable_iters and min_profitable_estimate.
+       (vect_transform_loop): Treat th as an inclusive lower bound.
+       * tree-vect-loop-manip.c (vect_loop_versioning): Likewise.
+
  2017-07-03  Dominique d'Humieres  <dominiq@lps.ens.fr>
  
         PR target/81033
diff --git a/gcc/tree-vect-loop-manip.c b/gcc/tree-vect-loop-manip.c

index aa52c50f531dc68046a0849abfc8865cc664cd01..34e4aa246fa10ee9dec1b987a4b9102b5f1dd8f2 100644 (file)
--- a/gcc/tree-vect-loop-manip.c
+++ b/gcc/tree-vect-loop-manip.c
@@ -2142,7 +2142,7 @@ vect_loop_versioning (loop_vec_info loop_vinfo,
    bool version_niter = LOOP_REQUIRES_VERSIONING_FOR_NITERS (loop_vinfo);
  
    if (check_profitability)
-    cond_expr = fold_build2 (GT_EXPR, boolean_type_node, scalar_loop_iters,
+    cond_expr = fold_build2 (GE_EXPR, boolean_type_node, scalar_loop_iters,
                              build_int_cst (TREE_TYPE (scalar_loop_iters),
                                                        th));
  
diff --git a/gcc/tree-vect-loop.c b/gcc/tree-vect-loop.c

index 599a328123598bd9f66704cd206ea15e30067c86..ae41ffaa335b36726af2946df22e5cd3e651429a 100644 (file)
--- a/gcc/tree-vect-loop.c
+++ b/gcc/tree-vect-loop.c
@@ -2135,21 +2135,17 @@ start_over:
        goto again;
      }
  
-  min_scalar_loop_bound = ((PARAM_VALUE (PARAM_MIN_VECT_LOOP_BOUND)
-                           * vectorization_factor) - 1);
+  min_scalar_loop_bound = (PARAM_VALUE (PARAM_MIN_VECT_LOOP_BOUND)
+                          * vectorization_factor);
  
    /* Use the cost model only if it is more conservative than user specified
       threshold.  */
-  th = (unsigned) min_scalar_loop_bound;
-  if (min_profitable_iters
-      && (!min_scalar_loop_bound
-          || min_profitable_iters > min_scalar_loop_bound))
-    th = (unsigned) min_profitable_iters;
+  th = (unsigned) MAX (min_scalar_loop_bound, min_profitable_iters);
  
    LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo) = th;
  
    if (LOOP_VINFO_NITERS_KNOWN_P (loop_vinfo)
-      && LOOP_VINFO_INT_NITERS (loop_vinfo) <= th)
+      && LOOP_VINFO_INT_NITERS (loop_vinfo) < th)
      {
        if (dump_enabled_p ())
         dump_printf_loc (MSG_MISSED_OPTIMIZATION, vect_location,
@@ -2168,7 +2164,7 @@ start_over:
      estimated_niter = max_niter;
    if (estimated_niter != -1
        && ((unsigned HOST_WIDE_INT) estimated_niter
-          <= MAX (th, (unsigned)min_profitable_estimate)))
+          < MAX (th, (unsigned) min_profitable_estimate)))
      {
        if (dump_enabled_p ())
         dump_printf_loc (MSG_MISSED_OPTIMIZATION, vect_location,
@@ -2185,9 +2181,9 @@ start_over:
  
    /* Decide whether we need to create an epilogue loop to handle
       remaining scalar iterations.  */
-  th = ((LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo) + 1)
-        / LOOP_VINFO_VECT_FACTOR (loop_vinfo))
-       * LOOP_VINFO_VECT_FACTOR (loop_vinfo);
+  th = ((LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo)
+        / LOOP_VINFO_VECT_FACTOR (loop_vinfo))
+       * LOOP_VINFO_VECT_FACTOR (loop_vinfo));
  
    if (LOOP_VINFO_NITERS_KNOWN_P (loop_vinfo)
        && LOOP_VINFO_PEELING_FOR_ALIGNMENT (loop_vinfo) > 0)
@@ -2250,7 +2246,7 @@ start_over:
        /* Niters for at least one iteration of vectorized loop.  */
        niters_th += LOOP_VINFO_VECT_FACTOR (loop_vinfo);
        /* One additional iteration because of peeling for gap.  */
-      if (!LOOP_VINFO_PEELING_FOR_GAPS (loop_vinfo))
+      if (LOOP_VINFO_PEELING_FOR_GAPS (loop_vinfo))
         niters_th++;
        if (LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo) < niters_th)
         LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo) = niters_th;
@@ -3550,7 +3546,7 @@ vect_estimate_min_profitable_iters (loop_vec_info loop_vinfo,
    if ((scalar_single_iter_cost * vf) > (int) vec_inside_cost)
      {
        if (vec_outside_cost <= 0)
-        min_profitable_iters = 1;
+        min_profitable_iters = 0;
        else
          {
            min_profitable_iters = ((vec_outside_cost - scalar_outside_cost) * vf
@@ -3591,11 +3587,6 @@ vect_estimate_min_profitable_iters (loop_vec_info loop_vinfo,
    min_profitable_iters =
         min_profitable_iters < vf ? vf : min_profitable_iters;
  
-  /* Because the condition we create is:
-     if (niters <= min_profitable_iters)
-       then skip the vectorized loop.  */
-  min_profitable_iters--;
-
    if (dump_enabled_p ())
      dump_printf_loc (MSG_NOTE, vect_location,
                       "  Runtime profitability threshold = %d\n",
@@ -3611,7 +3602,7 @@ vect_estimate_min_profitable_iters (loop_vec_info loop_vinfo,
       SIC * niters > VIC * ((niters-PL_ITERS-EP_ITERS)/VF) + VOC + SOC  */
  
    if (vec_outside_cost <= 0)
-    min_profitable_estimate = 1;
+    min_profitable_estimate = 0;
    else
      {
        min_profitable_estimate = ((vec_outside_cost + scalar_outside_cost) * vf
@@ -3620,7 +3611,6 @@ vect_estimate_min_profitable_iters (loop_vec_info loop_vinfo,
                                  / ((scalar_single_iter_cost * vf)
                                    - vec_inside_cost);
      }
-  min_profitable_estimate --;
    min_profitable_estimate = MAX (min_profitable_estimate, min_profitable_iters);
    if (dump_enabled_p ())
      dump_printf_loc (MSG_NOTE, vect_location,
@@ -7276,7 +7266,7 @@ vect_transform_loop (loop_vec_info loop_vinfo)
       run at least the vectorization factor number of times checking
       is pointless, too.  */
    th = LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo);
-  if (th >= LOOP_VINFO_VECT_FACTOR (loop_vinfo) - 1
+  if (th >= LOOP_VINFO_VECT_FACTOR (loop_vinfo)
        && !LOOP_VINFO_NITERS_KNOWN_P (loop_vinfo))
      {
        if (dump_enabled_p ())
author	Richard Sandiford <richard.sandiford@linaro.org>
	Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)
committer	Richard Sandiford <rsandifo@gcc.gnu.org>
	Mon, 3 Jul 2017 16:30:43 +0000 (16:30 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/tree-vect-loop-manip.c		patch \| blob \| history
gcc/tree-vect-loop.c		patch \| blob \| history