vect: Account for unused IFN_LOAD_LANES results
author: Richard Sandiford <richard.sandiford@arm.com>
Thu, 14 Jan 2021 11:36:25 +0000 (11:36 +0000)
committer: Richard Sandiford <richard.sandiford@arm.com>
Thu, 14 Jan 2021 11:36:25 +0000 (11:36 +0000)
At the moment, if we use only one vector of an LD4 result,
we'll treat the LD4 as having the cost of a single load.
But all 4 loads and any associated permutes take place
regardless of which results are actually used.

This patch therefore counts the cost of unused LOAD_LANES
results against the first statement in a group.  An alternative
would be to multiply the ncopies of the first stmt by the group
size and treat other stmts in the group as having zero cost,
but I thought that might be more surprising when reading dumps.

gcc/
* tree-vect-stmts.c (vect_model_load_cost): Account for unused
IFN_LOAD_LANES results.

gcc/testsuite/
* gcc.target/aarch64/sve/cost_model_11.c: New test.
* gcc.target/aarch64/sve/mask_struct_load_5.c: Use
-fno-vect-cost-model.

gcc/testsuite/gcc.target/aarch64/sve/cost_model_11.c [new file with mode: 0644]
gcc/testsuite/gcc.target/aarch64/sve/mask_struct_load_5.c
gcc/tree-vect-stmts.c

diff --git a/gcc/testsuite/gcc.target/aarch64/sve/cost_model_11.c b/gcc/testsuite/gcc.target/aarch64/sve/cost_model_11.c
new file mode 100644 (file)
index 0000000..d9f4ccc
--- /dev/null
@@ -0,0 +1,12 @@
+/* { dg-options "-O2 -ftree-vectorize -msve-vector-bits=128" } */
+
+long
+f (long *x, long *y, long *z, long n)
+{
+  long res = 0;
+  for (long i = 0; i < n; ++i)
+    z[i] = x[i * 4] + y[i * 4];
+  return res;
+}
+
+/* { dg-final { scan-assembler-not {\tld4d\t} } } */
index da367e4fd79dc2b1ffde08d6ae0a8b63bf334f39..2a33ee81d1ab1e8d3b4a8a2785ac96216ed25f5a 100644 (file)
@@ -1,5 +1,5 @@
 /* { dg-do compile } */
-/* { dg-options "-O2 -ftree-vectorize -ffast-math --param aarch64-sve-compare-costs=0" } */
+/* { dg-options "-O2 -ftree-vectorize -ffast-math -fno-vect-cost-model" } */
 
 #include <stdint.h>
 
index 068e49823035f9223cada9e4162e777aa56d1f2e..4d72c4db2f72f33940312876577d7f0b792acecc 100644 (file)
@@ -1120,6 +1120,30 @@ vect_model_load_cost (vec_info *vinfo,
      once per group anyhow.  */
   bool first_stmt_p = (first_stmt_info == stmt_info);
 
+  /* An IFN_LOAD_LANES will load all its vector results, regardless of which
+     ones we actually need.  Account for the cost of unused results.  */
+  if (first_stmt_p && !slp_node && memory_access_type == VMAT_LOAD_STORE_LANES)
+    {
+      unsigned int gaps = DR_GROUP_SIZE (first_stmt_info);
+      stmt_vec_info next_stmt_info = first_stmt_info;
+      do
+       {
+         gaps -= 1;
+         next_stmt_info = DR_GROUP_NEXT_ELEMENT (next_stmt_info);
+       }
+      while (next_stmt_info);
+      if (gaps)
+       {
+         if (dump_enabled_p ())
+           dump_printf_loc (MSG_NOTE, vect_location,
+                            "vect_model_load_cost: %d unused vectors.\n",
+                            gaps);
+         vect_get_load_cost (vinfo, stmt_info, ncopies * gaps, false,
+                             &inside_cost, &prologue_cost,
+                             cost_vec, cost_vec, true);
+       }
+    }
+
   /* We assume that the cost of a single load-lanes instruction is
      equivalent to the cost of DR_GROUP_SIZE separate loads.  If a grouped
      access is instead being provided by a load-and-permute operation,