summary | refs | log | tree | commit | diff | stats
path: root/llvm/test/CodeGen
diff options
context:
space:
mode:
author: Craig Topper <craig.topper@gmail.com> 2016-07-25 07:20:35 +0000
committer: Craig Topper <craig.topper@gmail.com> 2016-07-25 07:20:35 +0000
commit: ce415ff9c5a469aa75f6471ead4318d99f457ac9 (patch)
tree: b672e498ea6ecc1f6d47d831188b033ca464d012 /llvm/test/CodeGen
parent: 318e40b6f71559f97f604951cebcfbaf7ee86e6a (diff)
download: bcm5719-llvm-ce415ff9c5a469aa75f6471ead4318d99f457ac9.tar.gz
download: bcm5719-llvm-ce415ff9c5a469aa75f6471ead4318d99f457ac9.zip
[AVX512] Add load folding support for the unmasked forms of the FMA instructions.
llvm-svn: 276615
Diffstat (limited to 'llvm/test/CodeGen')
-rw-r--r-- llvm/test/CodeGen/X86/fma_patterns.ll | 6
-rw-r--r-- llvm/test/CodeGen/X86/fma_patterns_wide.ll | 6
2 files changed, 4 insertions, 8 deletions
diff --git a/llvm/test/CodeGen/X86/fma_patterns.ll b/llvm/test/CodeGen/X86/fma_patterns.ll
index b724da20425..371361ddeef 100644
--- a/llvm/test/CodeGen/X86/fma_patterns.ll
+++ b/llvm/test/CodeGen/X86/fma_patterns.ll
@@ -524,8 +524,7 @@ define <4 x float> @test_4f32_fmadd_load(<4 x float>* %a0, <4 x float> %a1, <4 x
;
; AVX512-LABEL: test_4f32_fmadd_load:
; AVX512: # BB#0:
-; AVX512-NEXT: vmovaps (%rdi), %xmm2
-; AVX512-NEXT: vfmadd213ps %xmm1, %xmm2, %xmm0
+; AVX512-NEXT: vfmadd132ps (%rdi), %xmm1, %xmm0
; AVX512-NEXT: retq
%x = load <4 x float>, <4 x float>* %a0
%y = fmul <4 x float> %x, %a1
@@ -546,8 +545,7 @@ define <2 x double> @test_2f64_fmsub_load(<2 x double>* %a0, <2 x double> %a1, <
;
; AVX512-LABEL: test_2f64_fmsub_load:
; AVX512: # BB#0:
-; AVX512-NEXT: vmovapd (%rdi), %xmm2
-; AVX512-NEXT: vfmsub213pd %xmm1, %xmm2, %xmm0
+; AVX512-NEXT: vfmsub132pd (%rdi), %xmm1, %xmm0
; AVX512-NEXT: retq
%x = load <2 x double>, <2 x double>* %a0
%y = fmul <2 x double> %x, %a1
diff --git a/llvm/test/CodeGen/X86/fma_patterns_wide.ll b/llvm/test/CodeGen/X86/fma_patterns_wide.ll
index 98b6c496e08..2c49bb851c3 100644
--- a/llvm/test/CodeGen/X86/fma_patterns_wide.ll
+++ b/llvm/test/CodeGen/X86/fma_patterns_wide.ll
@@ -217,8 +217,7 @@ define <16 x float> @test_16f32_fmadd_load(<16 x float>* %a0, <16 x float> %a1,
;
; AVX512-LABEL: test_16f32_fmadd_load:
; AVX512: # BB#0:
-; AVX512-NEXT: vmovaps (%rdi), %zmm2
-; AVX512-NEXT: vfmadd213ps %zmm1, %zmm2, %zmm0
+; AVX512-NEXT: vfmadd132ps (%rdi), %zmm1, %zmm0
; AVX512-NEXT: retq
%x = load <16 x float>, <16 x float>* %a0
%y = fmul <16 x float> %x, %a1
@@ -241,8 +240,7 @@ define <8 x double> @test_8f64_fmsub_load(<8 x double>* %a0, <8 x double> %a1, <
;
; AVX512-LABEL: test_8f64_fmsub_load:
; AVX512: # BB#0:
-; AVX512-NEXT: vmovapd (%rdi), %zmm2
-; AVX512-NEXT: vfmsub213pd %zmm1, %zmm2, %zmm0
+; AVX512-NEXT: vfmsub132pd (%rdi), %zmm1, %zmm0
; AVX512-NEXT: retq
%x = load <8 x double>, <8 x double>* %a0
%y = fmul <8 x double> %x, %a1
OpenPOWER on IntegriCloud