2016-06-22 Ilya Enkovich <ilya.enkovich@intel.com>
- PR middle-end/71488
+ PR tree-optimization/71488
* tree-vect-patterns.c (vect_recog_mask_conversion_pattern): Support
comparison of boolean vectors.
* tree-vect-stmts.c (vectorizable_comparison): Vectorize comparison
+2016-06-23 Uros Bizjak <ubizjak@gmail.com>
+
+ PR tree-optimization/71488
+ * gcc.target/i386/i386.exp (check_effective_target_sse4): Move to ...
+ * lib/target-supports.exp: ... here.
+ (check_sse4_hw_available): New procedure.
+ (check_effective_target_sse4_runtime): Ditto.
+ * g++.dg/pr71488.C (dg-additional-options): Use -msse4 instead of
+ -march=westmere for sse4_runtime targets.
+ * gcc.dg/vect/vect-bool-cmp.c: Include "tree-vect.h".
+ (dg-additional-options): Use for sse4_runtime targets.
+ (main): Call check_vect ().
+ (dg-final): Perform scan only for sse4_runtime targets.
+
2016-06-23 H.J. Lu <hongjiu.lu@intel.com>
PR target/66232
* gcc.target/i386/pr67400-4.c: Likewise.
* gcc.target/i386/pr67400-6.c: Likewise.
* gcc.target/i386/pr67400-7.c: Likewise.
- * lib/target-supports.exp (check_effective_target_got32x_reloc):
- New.
+ * lib/target-supports.exp (check_effective_target_got32x_reloc): New.
2016-06-23 Jerry DeLisle <jvdelisle@gcc.gnu.org>
2016-06-22 Ilya Enkovich <ilya.enkovich@intel.com>
- PR middle-end/71488
+ PR tree-optimization/71488
* g++.dg/pr71488.C: New test.
* gcc.dg/vect/vect-bool-cmp.c: New test.
-// PR middle-end/71488
+// PR tree-optimization/71488
// { dg-do run }
// { dg-options "-O3 -std=c++11" }
-// { dg-additional-options "-march=westmere" { target i?86-*-* x86_64-*-* } }
+// { dg-additional-options "-msse4" { target sse4_runtime } }
// { dg-require-effective-target c++11 }
#include <valarray>
-/* PR71488 */
+/* PR tree-optimization/71488 */
/* { dg-require-effective-target vect_int } */
/* { dg-require-effective-target vect_pack_trunc } */
-/* { dg-additional-options "-msse4" { target { i?86-*-* x86_64-*-* } } } */
+/* { dg-additional-options "-msse4" { target sse4_runtime } } */
+
+#include "tree-vect.h"
int i1, i2;
long long l2[32];
int i;
+ check_vect ();
+
for (i = 0; i < 32; i++)
{
l2[i] = i2[i] = s2[i] = i % 2;
check (res, ne);
}
-/* { dg-final { scan-tree-dump-times "VECTORIZED" 18 "vect" { target { i?86-*-* x86_64-*-* } } } } */
+/* { dg-final { scan-tree-dump-times "VECTORIZED" 18 "vect" { target sse4_runtime } } } */
} "-O2 -mssse3" ]
}
-# Return 1 if sse4 instructions can be compiled.
-proc check_effective_target_sse4 { } {
- return [check_no_compiler_messages sse4.1 object {
- typedef long long __m128i __attribute__ ((__vector_size__ (16)));
- typedef int __v4si __attribute__ ((__vector_size__ (16)));
-
- __m128i _mm_mullo_epi32 (__m128i __X, __m128i __Y)
- {
- return (__m128i) __builtin_ia32_pmulld128 ((__v4si)__X,
- (__v4si)__Y);
- }
- } "-O2 -msse4.1" ]
-}
-
# Return 1 if aes instructions can be compiled.
proc check_effective_target_aes { } {
return [check_no_compiler_messages aes object {
}]
}
+# Return 1 if the target supports executing SSE4 instructions, 0
+# otherwise.  Cache the result.
+#
+# Targets other than x86_64-*-* and i?86-*-* evaluate to 0 without
+# running anything.  On x86 a small probe program is built and run: it
+# queries CPUID leaf 1 through __get_cpuid and exits with status 0 only
+# when bit_SSE4_2 is set in ECX; it exits with status 1 when the bit is
+# clear or when __get_cpuid itself fails.
+# NOTE(review): this presumes check_runtime_nocache reports a zero exit
+# status as 1 -- confirm against its definition.
+
+proc check_sse4_hw_available { } {
+ return [check_cached_effective_target sse4_hw_available {
+ # Only x86 targets are probed; every other target evaluates to 0.
+ if { !([istarget x86_64-*-*] || [istarget i?86-*-*]) } {
+ expr 0
+ } else {
+ # Build and run the CPUID probe.  The trailing "" is passed to
+ # check_runtime_nocache after the program text.
+ check_runtime_nocache sse4_hw_available {
+ #include "cpuid.h"
+ int main ()
+ {
+ unsigned int eax, ebx, ecx, edx;
+ if (__get_cpuid (1, &eax, &ebx, &ecx, &edx))
+ return !(ecx & bit_SSE4_2);
+ return 1;
+ }
+ } ""
+ }
+ }]
+}
+
# Return 1 if the target supports executing AVX instructions, 0
# otherwise. Cache the result.
return 0
}
+# Return 1 if the target supports running SSE4 executables, 0 otherwise.
+#
+# All three of the following checks must succeed:
+#   check_effective_target_sse4     - SSE4 code can be compiled,
+#   check_sse4_hw_available         - the hardware check passes,
+#   check_sse_os_support_available  - the SSE OS support check passes.
+# The conditions are joined with &&, so a later check is only evaluated
+# when the earlier ones succeeded.
+
+proc check_effective_target_sse4_runtime { } {
+ if { [check_effective_target_sse4]
+ && [check_sse4_hw_available]
+ && [check_sse_os_support_available] } {
+ return 1
+ }
+ return 0
+}
+
# Return 1 if the target supports running AVX executables, 0 otherwise.
proc check_effective_target_avx_runtime { } {
} "-O2 -msse2" ]
}
+# Return 1 if sse4.1 instructions can be compiled.
+#
+# The probe is a single function that wraps __builtin_ia32_pmulld128 on
+# 16-byte integer vectors.  It is handed to check_no_compiler_messages
+# under the name "sse4.1" with the options "-O2 -msse4.1"; the result of
+# that call is returned unchanged.
+proc check_effective_target_sse4 { } {
+ return [check_no_compiler_messages sse4.1 object {
+ typedef long long __m128i __attribute__ ((__vector_size__ (16)));
+ typedef int __v4si __attribute__ ((__vector_size__ (16)));
+
+ __m128i _mm_mullo_epi32 (__m128i __X, __m128i __Y)
+ {
+ return (__m128i) __builtin_ia32_pmulld128 ((__v4si)__X,
+ (__v4si)__Y);
+ }
+ } "-O2 -msse4.1" ]
+}
+
# Return 1 if F16C instructions can be compiled.
proc check_effective_target_f16c { } {