diff options
| author | gganesh <gganesh@138bc75d-0d04-0410-961f-82ee72b054a4> | 2014-08-12 10:07:31 +0000 |
|---|---|---|
| committer | gganesh <gganesh@138bc75d-0d04-0410-961f-82ee72b054a4> | 2014-08-12 10:07:31 +0000 |
| commit | 816faba136b6986370cfc2cebb5a80dc2b158e05 (patch) | |
| tree | 981190c30a47eb0544db4c416444b57f3a242828 | |
| parent | d641d6d57895b5027dc5a407cc5c4f7fe7d628d0 (diff) | |
| download | ppe42-gcc-816faba136b6986370cfc2cebb5a80dc2b158e05.tar.gz ppe42-gcc-816faba136b6986370cfc2cebb5a80dc2b158e05.zip | |
Backport from mainline: handle 64-bit multiplication without the vpmacsdql instruction.
git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/branches/gcc-4_9-branch@213850 138bc75d-0d04-0410-961f-82ee72b054a4
| -rw-r--r-- | gcc/ChangeLog | 10 | ||||
| -rw-r--r-- | gcc/config/i386/i386.c | 6 | ||||
| -rw-r--r-- | gcc/testsuite/ChangeLog | 9 | ||||
| -rw-r--r-- | gcc/testsuite/gcc.target/i386/xop-imul64-vector.c | 1 |
4 files changed, 23 insertions, 3 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index de2ef232724..2d77d2656c4 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,13 @@ +2014-08-12 Ganesh Gopalasubramanian <Ganesh.Gopalasubramanian@amd.com> + + Backport from mainline + 2014-06-16 Ganesh Gopalasubramanian + <Ganesh.Gopalasubramanian@amd.com> + + * config/i386/i386.c (ix86_expand_sse2_mulvxdi3): Issue + instructions "vpmuludq" and "vpaddq" instead of "vpmacsdql" for + handling 32-bit multiplication. + 2014-08-08 Guozhi Wei <carrot@google.com> * config/rs6000/rs6000.md (*movdi_internal64): Add a new constraint. diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c index 0a6e6449204..0e0e4158b5c 100644 --- a/gcc/config/i386/i386.c +++ b/gcc/config/i386/i386.c @@ -45092,8 +45092,10 @@ ix86_expand_sse2_mulvxdi3 (rtx op0, rtx op1, rtx op2) /* t4: ((B*E)+(A*F))<<32, ((D*G)+(C*H))<<32 */ emit_insn (gen_ashlv2di3 (t4, t3, GEN_INT (32))); - /* op0: (((B*E)+(A*F))<<32)+(B*F), (((D*G)+(C*H))<<32)+(D*H) */ - emit_insn (gen_xop_pmacsdql (op0, op1, op2, t4)); + /* Multiply lower parts and add all */ + t5 = gen_reg_rtx (V2DImode); + emit_insn (gen_vec_widen_umult_even_v4si (t5, gen_lowpart (V4SImode, op1), gen_lowpart (V4SImode, op2))); + op0 = expand_binop (mode, add_optab, t5, t4, op0, 1, OPTAB_DIRECT); } else { diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index fbea5545d22..9054e088508 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,12 @@ +2014-08-12 Ganesh Gopalasubramanian <Ganesh.Gopalasubramanian@amd.com> + + Backport from mainline + 2014-06-16 Ganesh Gopalasubramanian + <Ganesh.Gopalasubramanian@amd.com> + + * gcc.target/i386/xop-imul64-vector.c: Remove the check for + vpmacsdql instruction. 
+ 2014-08-11 Janis Johnson <janisjo@codesourcery.com> Backport from mainline diff --git a/gcc/testsuite/gcc.target/i386/xop-imul64-vector.c b/gcc/testsuite/gcc.target/i386/xop-imul64-vector.c index 382677e6050..97ef3935a8b 100644 --- a/gcc/testsuite/gcc.target/i386/xop-imul64-vector.c +++ b/gcc/testsuite/gcc.target/i386/xop-imul64-vector.c @@ -33,4 +33,3 @@ int main () /* { dg-final { scan-assembler "vpmulld" } } */ /* { dg-final { scan-assembler "vphadddq" } } */ -/* { dg-final { scan-assembler "vpmacsdql" } } */ |

