diff options
| author | Simon Pilgrim <llvm-dev@redking.me.uk> | 2019-02-10 14:54:57 +0000 |
|---|---|---|
| committer | Simon Pilgrim <llvm-dev@redking.me.uk> | 2019-02-10 14:54:57 +0000 |
| commit | 76683e7b5800abd0b194bfb93ae8c85c60581665 (patch) | |
| tree | 9b7747a7644ab8d12eb0276c5a34b05322334f44 | |
| parent | 2f319420f920a4cf0b11a15a38238e301ba9a375 (diff) | |
| download | bcm5719-llvm-76683e7b5800abd0b194bfb93ae8c85c60581665.tar.gz bcm5719-llvm-76683e7b5800abd0b194bfb93ae8c85c60581665.zip | |
[X86] Add additional tests for funnel undef/zero argument combines
As suggested on D58009
llvm-svn: 353640
| -rw-r--r-- | llvm/test/CodeGen/X86/funnel-shift.ll | 216 |
1 files changed, 216 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/funnel-shift.ll b/llvm/test/CodeGen/X86/funnel-shift.ll index ade636bc3ec..55c1b3ca9ee 100644 --- a/llvm/test/CodeGen/X86/funnel-shift.ll +++ b/llvm/test/CodeGen/X86/funnel-shift.ll @@ -428,6 +428,23 @@ define i32 @fshl_i32_undef1_cst(i32 %a0) nounwind { ret i32 %res } +define i32 @fshl_i32_undef2(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshl_i32_undef2: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: shldl %cl, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_undef2: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %edi, %eax +; X64-AVX2-NEXT: shldl %cl, %esi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 %a0, i32 %a1, i32 undef) + ret i32 %res +} + define i32 @fshr_i32_undef0(i32 %a0, i32 %a1) nounwind { ; X32-SSE2-LABEL: fshr_i32_undef0: ; X32-SSE2: # %bb.0: @@ -496,6 +513,205 @@ define i32 @fshr_i32_undef1_cst(i32 %a0) nounwind { ret i32 %res } +define i32 @fshr_i32_undef2(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshr_i32_undef2: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: shrdl %cl, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_undef2: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %eax +; X64-AVX2-NEXT: shrdl %cl, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 %a0, i32 %a1, i32 undef) + ret i32 %res +} + +; shift zero args + +define i32 @fshl_i32_zero0(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshl_i32_zero0: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %cl +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shldl %cl, %edx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_zero0: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %ecx +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: # kill: def $cl killed $cl killed $ecx +; X64-AVX2-NEXT: shldl %cl, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 0, i32 %a0, i32 %a1) + ret i32 %res +} + +define i32 @fshl_i32_zero0_cst(i32 %a0) nounwind { +; X32-SSE2-LABEL: fshl_i32_zero0_cst: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shldl $9, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_zero0_cst: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: shldl $9, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 0, i32 %a0, i32 9) + ret i32 %res +} + +define i32 @fshl_i32_zero1(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshl_i32_zero1: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %cl +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: xorl %edx, %edx +; X32-SSE2-NEXT: shldl %cl, %edx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_zero1: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %ecx +; X64-AVX2-NEXT: movl %edi, %eax +; X64-AVX2-NEXT: xorl %edx, %edx +; X64-AVX2-NEXT: # kill: def $cl killed $cl killed $ecx +; X64-AVX2-NEXT: shldl %cl, %edx, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 %a0, i32 0, i32 %a1) + ret i32 %res +} + +define i32 @fshl_i32_zero1_cst(i32 %a0) nounwind { +; X32-SSE2-LABEL: fshl_i32_zero1_cst: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shrdl $23, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_zero1_cst: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: shrdl $23, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 %a0, i32 0, i32 9) + ret i32 %res +} + +define i32 @fshr_i32_zero0(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshr_i32_zero0: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %cl +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: xorl %edx, %edx +; X32-SSE2-NEXT: shrdl %cl, %edx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_zero0: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %ecx +; X64-AVX2-NEXT: movl %edi, %eax +; X64-AVX2-NEXT: xorl %edx, %edx +; X64-AVX2-NEXT: # kill: def $cl killed $cl killed $ecx +; X64-AVX2-NEXT: shrdl %cl, %edx, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 0, i32 %a0, i32 %a1) + ret i32 %res +} + +define i32 @fshr_i32_zero0_cst(i32 %a0) nounwind { +; X32-SSE2-LABEL: fshr_i32_zero0_cst: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shldl $23, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_zero0_cst: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: shldl $23, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 0, i32 %a0, i32 9) + ret i32 %res +} + +define i32 @fshr_i32_zero1(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshr_i32_zero1: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %cl +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shrdl %cl, %edx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_zero1: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %ecx +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: # kill: def $cl killed $cl killed $ecx +; X64-AVX2-NEXT: shrdl %cl, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 %a0, i32 0, i32 %a1) + ret i32 %res +} + +define i32 @fshr_i32_zero1_cst(i32 %a0) nounwind { +; X32-SSE2-LABEL: fshr_i32_zero1_cst: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx +; X32-SSE2-NEXT: xorl %eax, %eax +; X32-SSE2-NEXT: shrdl $9, %ecx, %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_zero1_cst: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: xorl %eax, %eax +; X64-AVX2-NEXT: shrdl $9, %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 %a0, i32 0, i32 9) + ret i32 %res +} + +; shift by zero + +define i32 @fshl_i32_zero2(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshl_i32_zero2: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshl_i32_zero2: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %edi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshl.i32(i32 %a0, i32 %a1, i32 0) + ret i32 %res +} + +define i32 @fshr_i32_zero2(i32 %a0, i32 %a1) nounwind { +; X32-SSE2-LABEL: fshr_i32_zero2: +; X32-SSE2: # %bb.0: +; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax +; X32-SSE2-NEXT: retl +; +; X64-AVX2-LABEL: fshr_i32_zero2: +; X64-AVX2: # %bb.0: +; X64-AVX2-NEXT: movl %esi, %eax +; X64-AVX2-NEXT: retq + %res = call i32 @llvm.fshr.i32(i32 %a0, i32 %a1, i32 0) + ret i32 %res +} + ; With constant shift amount, this is 'shrd' or 'shld'. define i32 @fshr_i32_const_shift(i32 %x, i32 %y) nounwind { |

