summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorSimon Pilgrim <llvm-dev@redking.me.uk>2017-02-13 14:20:13 +0000
committerSimon Pilgrim <llvm-dev@redking.me.uk>2017-02-13 14:20:13 +0000
commitce2cb2d9684aa8d17aa75c4aebbcc25e720da521 (patch)
tree5b973857778352043415c562f2f32df8a309a140
parent490d4a6da6abf2d97c466ff2a160b5051336060a (diff)
downloadbcm5719-llvm-ce2cb2d9684aa8d17aa75c4aebbcc25e720da521.tar.gz
bcm5719-llvm-ce2cb2d9684aa8d17aa75c4aebbcc25e720da521.zip
[X86][SSE] Add v4f32 and v2f64 extract to store tests
llvm-svn: 294952
-rw-r--r--llvm/test/CodeGen/X86/extract-store.ll147
1 files changed, 147 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/extract-store.ll b/llvm/test/CodeGen/X86/extract-store.ll
index c4bca3f68d7..fda56f94000 100644
--- a/llvm/test/CodeGen/X86/extract-store.ll
+++ b/llvm/test/CodeGen/X86/extract-store.ll
@@ -359,6 +359,127 @@ define void @extract_i64_1(i64* nocapture %dst, <2 x i64> %foo) nounwind {
ret void
}
+define void @extract_f32_0(float* nocapture %dst, <4 x float> %foo) nounwind {
+; SSE-X32-LABEL: extract_f32_0:
+; SSE-X32: # BB#0:
+; SSE-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; SSE-X32-NEXT: movss %xmm0, (%eax)
+; SSE-X32-NEXT: retl
+;
+; SSE-X64-LABEL: extract_f32_0:
+; SSE-X64: # BB#0:
+; SSE-X64-NEXT: movss %xmm0, (%rdi)
+; SSE-X64-NEXT: retq
+;
+; AVX-X32-LABEL: extract_f32_0:
+; AVX-X32: # BB#0:
+; AVX-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; AVX-X32-NEXT: vmovss %xmm0, (%eax)
+; AVX-X32-NEXT: retl
+;
+; AVX-X64-LABEL: extract_f32_0:
+; AVX-X64: # BB#0:
+; AVX-X64-NEXT: vmovss %xmm0, (%rdi)
+; AVX-X64-NEXT: retq
+ %vecext = extractelement <4 x float> %foo, i32 0
+ store float %vecext, float* %dst, align 1
+ ret void
+}
+
+define void @extract_f32_3(float* nocapture %dst, <4 x float> %foo) nounwind {
+; SSE2-X32-LABEL: extract_f32_3:
+; SSE2-X32: # BB#0:
+; SSE2-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; SSE2-X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3]
+; SSE2-X32-NEXT: movss %xmm0, (%eax)
+; SSE2-X32-NEXT: retl
+;
+; SSE2-X64-LABEL: extract_f32_3:
+; SSE2-X64: # BB#0:
+; SSE2-X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3]
+; SSE2-X64-NEXT: movss %xmm0, (%rdi)
+; SSE2-X64-NEXT: retq
+;
+; SSE41-X32-LABEL: extract_f32_3:
+; SSE41-X32: # BB#0:
+; SSE41-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; SSE41-X32-NEXT: extractps $3, %xmm0, (%eax)
+; SSE41-X32-NEXT: retl
+;
+; SSE41-X64-LABEL: extract_f32_3:
+; SSE41-X64: # BB#0:
+; SSE41-X64-NEXT: extractps $3, %xmm0, (%rdi)
+; SSE41-X64-NEXT: retq
+;
+; AVX-X32-LABEL: extract_f32_3:
+; AVX-X32: # BB#0:
+; AVX-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; AVX-X32-NEXT: vextractps $3, %xmm0, (%eax)
+; AVX-X32-NEXT: retl
+;
+; AVX-X64-LABEL: extract_f32_3:
+; AVX-X64: # BB#0:
+; AVX-X64-NEXT: vextractps $3, %xmm0, (%rdi)
+; AVX-X64-NEXT: retq
+ %vecext = extractelement <4 x float> %foo, i32 3
+ store float %vecext, float* %dst, align 1
+ ret void
+}
+
+define void @extract_f64_0(double* nocapture %dst, <2 x double> %foo) nounwind {
+; SSE-X32-LABEL: extract_f64_0:
+; SSE-X32: # BB#0:
+; SSE-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; SSE-X32-NEXT: movlps %xmm0, (%eax)
+; SSE-X32-NEXT: retl
+;
+; SSE-X64-LABEL: extract_f64_0:
+; SSE-X64: # BB#0:
+; SSE-X64-NEXT: movlps %xmm0, (%rdi)
+; SSE-X64-NEXT: retq
+;
+; AVX-X32-LABEL: extract_f64_0:
+; AVX-X32: # BB#0:
+; AVX-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; AVX-X32-NEXT: vmovlps %xmm0, (%eax)
+; AVX-X32-NEXT: retl
+;
+; AVX-X64-LABEL: extract_f64_0:
+; AVX-X64: # BB#0:
+; AVX-X64-NEXT: vmovlps %xmm0, (%rdi)
+; AVX-X64-NEXT: retq
+ %vecext = extractelement <2 x double> %foo, i32 0
+ store double %vecext, double* %dst, align 1
+ ret void
+}
+
+define void @extract_f64_1(double* nocapture %dst, <2 x double> %foo) nounwind {
+; SSE-X32-LABEL: extract_f64_1:
+; SSE-X32: # BB#0:
+; SSE-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; SSE-X32-NEXT: movhpd %xmm0, (%eax)
+; SSE-X32-NEXT: retl
+;
+; SSE-X64-LABEL: extract_f64_1:
+; SSE-X64: # BB#0:
+; SSE-X64-NEXT: movhpd %xmm0, (%rdi)
+; SSE-X64-NEXT: retq
+;
+; AVX-X32-LABEL: extract_f64_1:
+; AVX-X32: # BB#0:
+; AVX-X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; AVX-X32-NEXT: vmovhpd %xmm0, (%eax)
+; AVX-X32-NEXT: retl
+;
+; AVX-X64-LABEL: extract_f64_1:
+; AVX-X64: # BB#0:
+; AVX-X64-NEXT: vmovhpd %xmm0, (%rdi)
+; AVX-X64-NEXT: retq
+ %vecext = extractelement <2 x double> %foo, i32 1
+ store double %vecext, double* %dst, align 1
+ ret void
+}
+
define void @extract_i8_undef(i8* nocapture %dst, <16 x i8> %foo) nounwind {
; X32-LABEL: extract_i8_undef:
; X32: # BB#0:
@@ -410,3 +531,29 @@ define void @extract_i64_undef(i64* nocapture %dst, <2 x i64> %foo) nounwind {
store i64 %vecext, i64* %dst, align 1
ret void
}
+
+define void @extract_f32_undef(float* nocapture %dst, <4 x float> %foo) nounwind {
+; X32-LABEL: extract_f32_undef:
+; X32: # BB#0:
+; X32-NEXT: retl
+;
+; X64-LABEL: extract_f32_undef:
+; X64: # BB#0:
+; X64-NEXT: retq
+ %vecext = extractelement <4 x float> %foo, i32 6 ; undef
+ store float %vecext, float* %dst, align 1
+ ret void
+}
+
+define void @extract_f64_undef(double* nocapture %dst, <2 x double> %foo) nounwind {
+; X32-LABEL: extract_f64_undef:
+; X32: # BB#0:
+; X32-NEXT: retl
+;
+; X64-LABEL: extract_f64_undef:
+; X64: # BB#0:
+; X64-NEXT: retq
+ %vecext = extractelement <2 x double> %foo, i32 2 ; undef
+ store double %vecext, double* %dst, align 1
+ ret void
+}
OpenPOWER on IntegriCloud