i386.opt (mcx16, msahf): New options.

author Uros Bizjak <ubizjak@gmail.com>

Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)

committer Uros Bizjak <uros@gcc.gnu.org>

Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)
author Uros Bizjak <ubizjak@gmail.com>
Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)
committer Uros Bizjak <uros@gcc.gnu.org>
Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 2006f4819338ec72fdc62fe1af15fd0d03b6774d..510f1bcb1e2e8225d68bfda2f4bb90434a464fdb 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,16 @@
+2007-03-13  Uros Bizjak  <ubizjak@gmail.com>
+
+       * config/i386/i386.opt (mcx16, msahf): New options.
+       * config/i386/i386.c (x86_cmpxchg16b, x86_sahf): Remove.
+       (ix86_tune_features) [X86_TUNE_USE_SAHF]: Enable for m_GENERIC.
+
+       * config/i386/driver-i386.c (bit_LAHF_LM): New define.
+       (host_detect_local_cpu): Detect cx16 and lahf_lm cpuid bits.
+       Output -mcx16 and -msahf options when corresponding bit is set.
+
+       * doc/invoke.texi (i386 and x86-64 Options): Document -mcx16
+       and -msahf options.
+
  2007-03-13  Alexandre Oliva  <aoliva@redhat.com>
  
         * configure.ac: Test for assembler tolerance to # 0 "".
diff --git a/gcc/config/i386/driver-i386.c b/gcc/config/i386/driver-i386.c

index 3a5d29de30df113518c2d513596bb1667bdee060..a4155373f1a343d436ebe5d118aa496d66778cc4 100644 (file)
--- a/gcc/config/i386/driver-i386.c
+++ b/gcc/config/i386/driver-i386.c
@@ -43,6 +43,7 @@ const char *host_detect_local_cpu (int argc, const char **argv);
  #define bit_SSE4a (1 << 6)
  #define bit_CMPXCHG16B (1 << 13)
  
+#define bit_LAHF_LM (1 << 0)
  #define bit_3DNOW (1 << 31)
  #define bit_3DNOWP (1 << 30)
  #define bit_LM (1 << 29)
@@ -188,6 +189,7 @@ const char *host_detect_local_cpu (int argc, const char **argv)
  {
    const char *cpu = NULL;
    const char *cache = "";
+  const char *options = "";
    enum processor_type processor = PROCESSOR_I386;
    unsigned int eax, ebx, ecx, edx;
    unsigned int max_level;
@@ -195,6 +197,7 @@ const char *host_detect_local_cpu (int argc, const char **argv)
    unsigned int ext_level;
    unsigned char has_mmx = 0, has_3dnow = 0, has_3dnowp = 0, has_sse = 0;
    unsigned char has_sse2 = 0, has_sse3 = 0, has_ssse3 = 0, has_cmov = 0;
+  unsigned char has_cmpxchg16b = 0, has_lahf_lm = 0;
    unsigned char has_longmode = 0, has_cmpxchg8b = 0, has_sse4a = 0;
    unsigned char is_amd = 0;
    unsigned int family = 0;
@@ -236,6 +239,7 @@ const char *host_detect_local_cpu (int argc, const char **argv)
    has_sse2 = !!(edx & bit_SSE2);
    has_sse3 = !!(ecx & bit_SSE3);
    has_ssse3 = !!(ecx & bit_SSSE3);
+  has_cmpxchg16b = !!(ecx & bit_CMPXCHG16B);
    /* We don't care for extended family.  */
    family = (eax >> 8) & ~(1 << 4);
  
@@ -244,6 +248,7 @@ const char *host_detect_local_cpu (int argc, const char **argv)
    if (ext_level >= 0x80000000)
      {
        cpuid (0x80000001, eax, ebx, ecx, edx);
+      has_lahf_lm = !!(ecx & bit_LAHF_LM);
        has_3dnow = !!(edx & bit_3DNOW);
        has_3dnowp = !!(edx & bit_3DNOWP);
        has_longmode = !!(edx & bit_LM);
@@ -416,8 +421,16 @@ const char *host_detect_local_cpu (int argc, const char **argv)
        break;
      }
  
+  if (arch)
+    {
+      if (has_cmpxchg16b)
+       options = concat (options, "-mcx16 ", NULL);
+      if (has_lahf_lm)
+       options = concat (options, "-msahf ", NULL);
+    }
+
  done:
-  return concat (cache, "-m", argv[0], "=", cpu, NULL);
+  return concat (cache, "-m", argv[0], "=", cpu, " ", options, NULL);
  }
  #else
  /* If we aren't compiling with GCC we just provide a minimal
diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c

index b4928ab5c7117328b8a66f6b7f9ae468df49e0f7..ca5b48a22f2b31be4e4c9f1d8a59b49c335977c2 100644 (file)
--- a/gcc/config/i386/i386.c
+++ b/gcc/config/i386/i386.c
@@ -1040,7 +1040,7 @@ unsigned int ix86_tune_features[X86_TUNE_LAST] = {
    
    /* X86_TUNE_USE_SAHF */
    m_PPRO | m_K6_GEODE | m_K8 | m_AMDFAM10 | m_PENT4
-  | m_NOCONA | m_CORE2 | m_GENERIC32,
+  | m_NOCONA | m_CORE2 | m_GENERIC,
  
    /* X86_TUNE_MOVX: Enable to zero extend integer registers to avoid
       partial dependencies.  */
@@ -1438,14 +1438,6 @@ enum processor_type ix86_arch;
  /* true if sse prefetch instruction is not NOOP.  */
  int x86_prefetch_sse;
  
-/* true if cmpxchg16b is supported.  */
-int x86_cmpxchg16b;
-
-/* true if sahf is supported. Early Intel CPUs with Intel 64
-   lacked LAHF and SAHF instructions supported by AMD64 until
-   introduction of Pentium 4 G1 step in December 2005.  */
-int x86_sahf;
-
  /* ix86_regparm_string as a number */
  static int ix86_regparm;
  
diff --git a/gcc/config/i386/i386.h b/gcc/config/i386/i386.h

index 06655d87dd312bfc54c42591b9a538567eefdd91..6605775d95d307a9d4a3a0410340a91147f15cab 100644 (file)
--- a/gcc/config/i386/i386.h
+++ b/gcc/config/i386/i386.h
@@ -322,17 +322,14 @@ extern unsigned int ix86_arch_features[X86_ARCH_LAST];
  #define TARGET_XADD            ix86_arch_features[X86_ARCH_XADD]
  #define TARGET_BSWAP           ix86_arch_features[X86_ARCH_BSWAP]
  
+#define TARGET_CMPXCHG16B      x86_cmpxchg16b
+#define TARGET_SAHF            x86_sahf
+
  #define TARGET_FISTTP          (TARGET_SSE3 && TARGET_80387)
  
  extern int x86_prefetch_sse;
  #define TARGET_PREFETCH_SSE    x86_prefetch_sse
  
-extern int x86_cmpxchg16b;
-#define TARGET_CMPXCHG16B      x86_cmpxchg16b
-
-extern int x86_sahf;
-#define TARGET_SAHF            x86_sahf
-
  #define ASSEMBLER_DIALECT      (ix86_asm_dialect)
  
  #define TARGET_SSE_MATH                ((ix86_fpmath & FPMATH_SSE) != 0)
diff --git a/gcc/config/i386/i386.opt b/gcc/config/i386/i386.opt

index 61c68074020160dae11302ec67cc933cbdeedf40..d8955ae3a930d7a43821a40354a5a3e6d9fe18a0 100644 (file)
--- a/gcc/config/i386/i386.opt
+++ b/gcc/config/i386/i386.opt
@@ -221,6 +221,14 @@ which include popcnt and lzcnt instructions, for popcount and clz built-ins
  namely __builtin_popcount, __builtin_popcountl, __builtin_popcountll and
  __builtin_clz, __builtin_clzl, __builtin_clzll
  
+mcx16
+Target Report RejectNegative Var(x86_cmpxchg16b)
+Support code generation of cmpxchg16b instruction.
+
+msahf
+Target Report RejectNegative Var(x86_sahf)
+Support code generation of sahf instruction in 64bit x86-64 code
+
  msseregparm
  Target RejectNegative Mask(SSEREGPARM)
  Use SSE register passing conventions for SF and DF mode
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi

index 61e82c30cffbc2b78250c4d137dfa20922ac18db..d5a5da581041c5d7a92c6fa45fc6713bc7d23222 100644 (file)
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -543,7 +543,7 @@ Objective-C and Objective-C++ Dialects}.
  -masm=@var{dialect}  -mno-fancy-math-387 @gol
  -mno-fp-ret-in-387  -msoft-float  -msvr3-shlib @gol
  -mno-wide-multiply  -mrtd  -malign-double @gol
--mpreferred-stack-boundary=@var{num} @gol
+-mpreferred-stack-boundary=@var{num} -mcx16 -msahf @gol
  -mmmx  -msse  -msse2 -msse3 -mssse3 -msse4a -m3dnow -mpopcnt -mabm @gol
  -mthreads  -mno-align-stringops  -minline-all-stringops @gol
  -mpush-args  -maccumulate-outgoing-args  -m128bit-long-double @gol
@@ -10081,6 +10081,22 @@ supported architecture, using the appropriate flags.  In particular,
  the file containing the CPU detection code should be compiled without
  these options.
  
+@item -mcx16
+@opindex -mcx16
+This option will enable GCC to use CMPXCHG16B instruction in generated code.
+CMPXCHG16B allows for atomic operations on 128-bit double quadword (or oword)
+data types.  This is useful for high resolution counters that could be updated
+by multiple processors (or cores).  This instruction is generated as part of
+atomic built-in functions: see @ref{Atomic Builtins} for details.
+
+@item -msahf
+@opindex -msahf
+This option will enable GCC to use SAHF instruction in generated code.  Early
+Intel CPUs with Intel 64 lacked LAHF and SAHF instructions supported by AMD64
+until introduction of Pentium 4 G1 step in December 2005.  LAHF and SAHF are
+load and store instructions, respectively, for certain status flags.  These
+instructions are used for virtualization and floating-point condition handling.
+
  @item -mpush-args
  @itemx -mno-push-args
  @opindex mpush-args
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index 3eb5ad10e45650b5be14f18aae026838491b5e01..3c03cb8742ba45710f8727d9fdeba55ec80e65a8 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,7 @@
+2007-03-13  Uros Bizjak  <ubizjak@gmail.com>
+       
+       * testsuite/gcc.target/i386/cmpxchg16b-1.c: New test.
+
  2007-03-12  Seongbae Park <seongbae.park@gmail.com>
  
         * gcc.dg/c90-vla-1.c: Reflect the change of the error message.
diff --git a/gcc/testsuite/gcc.target/i386/cmpxchg16b-1.c b/gcc/testsuite/gcc.target/i386/cmpxchg16b-1.c

new file mode 100644 (file)

index 0000000..5999544
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/cmpxchg16b-1.c
@@ -0,0 +1,13 @@
+/* { dg-do compile { target x86_64-*-* } } */
+/* { dg-options "-O2 -mcx16" } */
+
+typedef int TItype __attribute__ ((mode (TI)));
+
+TItype m_128;
+
+void test(TItype x_128)
+{
+  m_128 = __sync_val_compare_and_swap (&m_128, x_128, m_128);
+}
+
+/* { dg-final { scan-assembler "cmpxchg16b" } } */
author	Uros Bizjak <ubizjak@gmail.com>
	Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)
committer	Uros Bizjak <uros@gcc.gnu.org>
	Tue, 13 Mar 2007 21:18:33 +0000 (22:18 +0100)
gcc/ChangeLog		patch \| blob \| history
gcc/config/i386/driver-i386.c		patch \| blob \| history
gcc/config/i386/i386.c		patch \| blob \| history
gcc/config/i386/i386.h		patch \| blob \| history
gcc/config/i386/i386.opt		patch \| blob \| history
gcc/doc/invoke.texi		patch \| blob \| history
gcc/testsuite/ChangeLog		patch \| blob \| history
gcc/testsuite/gcc.target/i386/cmpxchg16b-1.c	[new file with mode: 0644]	patch \| blob