i386: Emulate MMX mmx_pmaddwd with SSE
authorH.J. Lu <hongjiu.lu@intel.com>
Wed, 15 May 2019 15:08:04 +0000 (15:08 +0000)
committerH.J. Lu <hjl@gcc.gnu.org>
Wed, 15 May 2019 15:08:04 +0000 (08:08 -0700)
Emulate MMX pmaddwd with SSE.  Only SSE register source operand is
allowed.

PR target/89021
* config/i386/mmx.md (mmx_pmaddwd): Also allow TARGET_MMX_WITH_SSE.
(*mmx_pmaddwd): Also allow TARGET_MMX_WITH_SSE.  Add SSE support.

From-SVN: r271220

gcc/ChangeLog
gcc/config/i386/mmx.md

index 7b2a9bb2e5e15c7b7f84303a806435e042483b37..597ba816fd40862c90c8d1fd68d229ff27a3204f 100644 (file)
@@ -1,3 +1,9 @@
+2019-05-15  H.J. Lu  <hongjiu.lu@intel.com>
+
+       PR target/89021
+       * config/i386/mmx.md (mmx_pmaddwd): Also allow TARGET_MMX_WITH_SSE.
+       (*mmx_pmaddwd): Also allow TARGET_MMX_WITH_SSE.  Add SSE support.
+
 2019-05-15  H.J. Lu  <hongjiu.lu@intel.com>
 
        PR target/89021
index d7c3bd45df6a871e6516cf2f788b150d7e1b7c7f..7cbca961a6089327fc6df891cb333b1aa4f31b82 100644 (file)
          (mult:V2SI
            (sign_extend:V2SI
              (vec_select:V2HI
-               (match_operand:V4HI 1 "nonimmediate_operand")
+               (match_operand:V4HI 1 "register_mmxmem_operand")
                (parallel [(const_int 0) (const_int 2)])))
            (sign_extend:V2SI
              (vec_select:V2HI
-               (match_operand:V4HI 2 "nonimmediate_operand")
+               (match_operand:V4HI 2 "register_mmxmem_operand")
                (parallel [(const_int 0) (const_int 2)]))))
          (mult:V2SI
            (sign_extend:V2SI
            (sign_extend:V2SI
              (vec_select:V2HI (match_dup 2)
                (parallel [(const_int 1) (const_int 3)]))))))]
-  "TARGET_MMX"
+  "TARGET_MMX || TARGET_MMX_WITH_SSE"
   "ix86_fixup_binary_operands_no_copy (MULT, V4HImode, operands);")
 
 (define_insn "*mmx_pmaddwd"
-  [(set (match_operand:V2SI 0 "register_operand" "=y")
+  [(set (match_operand:V2SI 0 "register_operand" "=y,x,Yv")
         (plus:V2SI
          (mult:V2SI
            (sign_extend:V2SI
              (vec_select:V2HI
-               (match_operand:V4HI 1 "nonimmediate_operand" "%0")
+               (match_operand:V4HI 1 "register_mmxmem_operand" "%0,0,Yv")
                (parallel [(const_int 0) (const_int 2)])))
            (sign_extend:V2SI
              (vec_select:V2HI
-               (match_operand:V4HI 2 "nonimmediate_operand" "ym")
+               (match_operand:V4HI 2 "register_mmxmem_operand" "ym,x,Yv")
                (parallel [(const_int 0) (const_int 2)]))))
          (mult:V2SI
            (sign_extend:V2SI
            (sign_extend:V2SI
              (vec_select:V2HI (match_dup 2)
                (parallel [(const_int 1) (const_int 3)]))))))]
-  "TARGET_MMX && ix86_binary_operator_ok (MULT, V4HImode, operands)"
-  "pmaddwd\t{%2, %0|%0, %2}"
-  [(set_attr "type" "mmxmul")
-   (set_attr "mode" "DI")])
+  "(TARGET_MMX || TARGET_MMX_WITH_SSE)
+   && ix86_binary_operator_ok (MULT, V4HImode, operands)"
+  "@
+   pmaddwd\t{%2, %0|%0, %2}
+   pmaddwd\t{%2, %0|%0, %2}
+   vpmaddwd\t{%2, %1, %0|%0, %1, %2}"
+  [(set_attr "mmx_isa" "native,x64_noavx,x64_avx")
+   (set_attr "type" "mmxmul,sseiadd,sseiadd")
+   (set_attr "mode" "DI,TI,TI")])
 
 (define_expand "mmx_pmulhrwv4hi3"
   [(set (match_operand:V4HI 0 "register_operand")