summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorSimon Pilgrim <llvm-dev@redking.me.uk>2017-09-24 13:45:49 +0000
committerSimon Pilgrim <llvm-dev@redking.me.uk>2017-09-24 13:45:49 +0000
commite1335b1c754833ae5daa6e7dc3b0021bce9cc137 (patch)
tree1b202bc71628b2897c13f4daf7713064a8337f7d
parenta705db9a9e9c255cee20dd27d2551b6eadb99e4b (diff)
downloadbcm5719-llvm-e1335b1c754833ae5daa6e7dc3b0021bce9cc137.tar.gz
bcm5719-llvm-e1335b1c754833ae5daa6e7dc3b0021bce9cc137.zip
[X86][SSE] Add more tests for shuffle combining with extracted vector elements (PR22415)
llvm-svn: 314077
-rw-r--r--llvm/test/CodeGen/X86/vector-shuffle-combining-ssse3.ll56
1 files changed, 56 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/vector-shuffle-combining-ssse3.ll b/llvm/test/CodeGen/X86/vector-shuffle-combining-ssse3.ll
index 4b6c8179487..a11cac0b9bd 100644
--- a/llvm/test/CodeGen/X86/vector-shuffle-combining-ssse3.ll
+++ b/llvm/test/CodeGen/X86/vector-shuffle-combining-ssse3.ll
@@ -689,6 +689,62 @@ define <16 x i8> @constant_fold_pshufb_2() {
ret <16 x i8> %1
}
+define i32 @mask_zzz3_v16i8(<16 x i8> %a0) {
+; SSSE3-LABEL: mask_zzz3_v16i8:
+; SSSE3: # BB#0:
+; SSSE3-NEXT: pshufb {{.*#+}} xmm0 = xmm0[8,10,12,14,8,10,12,14,0,2,4,6,8,10,12,14]
+; SSSE3-NEXT: movd %xmm0, %eax
+; SSSE3-NEXT: andl $-16777216, %eax # imm = 0xFF000000
+; SSSE3-NEXT: retq
+;
+; SSE41-LABEL: mask_zzz3_v16i8:
+; SSE41: # BB#0:
+; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,0,2,4,6,8,10,12,14]
+; SSE41-NEXT: pextrd $3, %xmm0, %eax
+; SSE41-NEXT: andl $-16777216, %eax # imm = 0xFF000000
+; SSE41-NEXT: retq
+;
+; AVX-LABEL: mask_zzz3_v16i8:
+; AVX: # BB#0:
+; AVX-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,0,2,4,6,8,10,12,14]
+; AVX-NEXT: vpextrd $3, %xmm0, %eax
+; AVX-NEXT: andl $-16777216, %eax # imm = 0xFF000000
+; AVX-NEXT: retq
+ %1 = call <16 x i8> @llvm.x86.ssse3.pshuf.b.128(<16 x i8> %a0, <16 x i8> <i8 0, i8 2, i8 4, i8 6, i8 8, i8 10, i8 12, i8 14, i8 0, i8 2, i8 4, i8 6, i8 8, i8 10, i8 12, i8 14>)
+ %2 = bitcast <16 x i8> %1 to <4 x i32>
+ %3 = extractelement <4 x i32> %2, i32 3
+ %4 = and i32 %3, 4278190080
+ ret i32 %4
+}
+
+define i32 @mask_z1z3_v16i8(<16 x i8> %a0) {
+; SSSE3-LABEL: mask_z1z3_v16i8:
+; SSSE3: # BB#0:
+; SSSE3-NEXT: pshufb {{.*#+}} xmm0 = xmm0[8,10,12,14,8,10,12,14,0,2,4,6,8,10,12,14]
+; SSSE3-NEXT: movd %xmm0, %eax
+; SSSE3-NEXT: andl $-16711936, %eax # imm = 0xFF00FF00
+; SSSE3-NEXT: retq
+;
+; SSE41-LABEL: mask_z1z3_v16i8:
+; SSE41: # BB#0:
+; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,0,2,4,6,8,10,12,14]
+; SSE41-NEXT: pextrd $3, %xmm0, %eax
+; SSE41-NEXT: andl $-16711936, %eax # imm = 0xFF00FF00
+; SSE41-NEXT: retq
+;
+; AVX-LABEL: mask_z1z3_v16i8:
+; AVX: # BB#0:
+; AVX-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,0,2,4,6,8,10,12,14]
+; AVX-NEXT: vpextrd $3, %xmm0, %eax
+; AVX-NEXT: andl $-16711936, %eax # imm = 0xFF00FF00
+; AVX-NEXT: retq
+ %1 = call <16 x i8> @llvm.x86.ssse3.pshuf.b.128(<16 x i8> %a0, <16 x i8> <i8 0, i8 2, i8 4, i8 6, i8 8, i8 10, i8 12, i8 14, i8 0, i8 2, i8 4, i8 6, i8 8, i8 10, i8 12, i8 14>)
+ %2 = bitcast <16 x i8> %1 to <4 x i32>
+ %3 = extractelement <4 x i32> %2, i32 3
+ %4 = and i32 %3, 4278255360
+ ret i32 %4
+}
+
define i32 @PR22415(double %a0) {
; SSE-LABEL: PR22415:
; SSE: # BB#0:
OpenPOWER on IntegriCloud