diff options
-rw-r--r-- | llvm/test/CodeGen/X86/reduce-trunc-shl.ll | 26 |
1 files changed, 20 insertions, 6 deletions
diff --git a/llvm/test/CodeGen/X86/reduce-trunc-shl.ll b/llvm/test/CodeGen/X86/reduce-trunc-shl.ll index 09082ac2162..c073ae02514 100644 --- a/llvm/test/CodeGen/X86/reduce-trunc-shl.ll +++ b/llvm/test/CodeGen/X86/reduce-trunc-shl.ll @@ -1,11 +1,25 @@ -; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+avx2 < %s | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+sse2 | FileCheck %s --check-prefix=SSE2 +; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mattr=+avx2 | FileCheck %s --check-prefix=AVX2 -; CHECK-LABEL: {{^}}trunc_shl_7_v4i32_v4i64: -; CHECK: vpshufd $136, (%rsi), %ymm0 -; CHECK: vpermq $236, %ymm0, %ymm0 -; CHECK: vpslld $7, %xmm0, %xmm0 -; CHECK: vmovdqa %xmm0, (%rdi) define void @trunc_shl_7_v4i32_v4i64(<4 x i32> addrspace(1)* %out, <4 x i64> addrspace(1)* %in) { +; SSE2-LABEL: trunc_shl_7_v4i32_v4i64: +; SSE2: # BB#0: +; SSE2-NEXT: pshufd {{.*#+}} xmm0 = mem[0,2,2,3] +; SSE2-NEXT: pshufd {{.*#+}} xmm1 = mem[0,2,2,3] +; SSE2-NEXT: punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0] +; SSE2-NEXT: pslld $7, %xmm1 +; SSE2-NEXT: movdqa %xmm1, (%rdi) +; SSE2-NEXT: retq +; +; AVX2-LABEL: trunc_shl_7_v4i32_v4i64: +; AVX2: # BB#0: +; AVX2-NEXT: vpshufd {{.*#+}} ymm0 = mem[0,2,0,2,4,6,4,6] +; AVX2-NEXT: vpermq {{.*#+}} ymm0 = ymm0[0,3,2,3] +; AVX2-NEXT: vpslld $7, %xmm0, %xmm0 +; AVX2-NEXT: vmovdqa %xmm0, (%rdi) +; AVX2-NEXT: vzeroupper +; AVX2-NEXT: retq %val = load <4 x i64>, <4 x i64> addrspace(1)* %in %shl = shl <4 x i64> %val, <i64 7, i64 7, i64 7, i64 7> %trunc = trunc <4 x i64> %shl to <4 x i32> |