diff options
-rw-r--r-- | llvm/test/CodeGen/X86/xor.ll | 550 |
1 files changed, 422 insertions, 128 deletions
Regenerate the FileCheck assertions in llvm/test/CodeGen/X86/xor.ll with
utils/update_llc_test_checks.py.  The hand-written partial checks are removed
and replaced by full per-function instruction sequences.  The two x86_64 RUN
lines keep the shared X64 prefix and each gain a second prefix of their own
(X64-LIN for x86_64-linux, X64-WIN for x86_64-win32), so output that differs
between the two triples is checked separately.

diff --git a/llvm/test/CodeGen/X86/xor.ll b/llvm/test/CodeGen/X86/xor.ll
index f78fe275786..6f0f0df465c 100644
--- a/llvm/test/CodeGen/X86/xor.ll
+++ b/llvm/test/CodeGen/X86/xor.ll
@@ -1,172 +1,441 @@
-; RUN: llc < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s -check-prefix=X32
-; RUN: llc < %s -mtriple=x86_64-linux -mattr=+sse2 | FileCheck %s -check-prefix=X64
-; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse2 | FileCheck %s -check-prefix=X64
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s -check-prefixes=X32
+; RUN: llc < %s -mtriple=x86_64-linux -mattr=+sse2 | FileCheck %s -check-prefixes=X64,X64-LIN
+; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse2 | FileCheck %s -check-prefixes=X64,X64-WIN
 
 ; Though it is undefined, we want xor undef,undef to produce zero.
 define <4 x i32> @test1() nounwind {
-	%tmp = xor <4 x i32> undef, undef
-	ret <4 x i32> %tmp
-
 ; X32-LABEL: test1:
-; X32: xorps %xmm0, %xmm0
-; X32: ret
+; X32: # %bb.0:
+; X32-NEXT: xorps %xmm0, %xmm0
+; X32-NEXT: retl
+;
+; X64-LABEL: test1:
+; X64: # %bb.0:
+; X64-NEXT: xorps %xmm0, %xmm0
+; X64-NEXT: retq
+  %tmp = xor <4 x i32> undef, undef
+  ret <4 x i32> %tmp
 }
 
 ; Though it is undefined, we want xor undef,undef to produce zero.
 define i32 @test2() nounwind{
-	%tmp = xor i32 undef, undef
-	ret i32 %tmp
 ; X32-LABEL: test2:
-; X32: xorl %eax, %eax
-; X32: ret
+; X32: # %bb.0:
+; X32-NEXT: xorl %eax, %eax
+; X32-NEXT: retl
+;
+; X64-LABEL: test2:
+; X64: # %bb.0:
+; X64-NEXT: xorl %eax, %eax
+; X64-NEXT: retq
+  %tmp = xor i32 undef, undef
+  ret i32 %tmp
 }
 
 define i32 @test3(i32 %a, i32 %b) nounwind {
-entry:
-	%tmp1not = xor i32 %b, -2
-	%tmp3 = and i32 %tmp1not, %a
-	%tmp4 = lshr i32 %tmp3, 1
-	ret i32 %tmp4
-
-; X64-LABEL: test3:
-; X64: notl
-; X64: andl
-; X64: shrl
-; X64: ret
-
 ; X32-LABEL: test3:
-; X32: movl 8(%esp), %eax
-; X32: notl %eax
-; X32: andl 4(%esp), %eax
-; X32: shrl %eax
-; X32: ret
+; X32: # %bb.0: # %entry
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: notl %eax
+; X32-NEXT: andl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: shrl %eax
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test3:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: notl %esi
+; X64-LIN-NEXT: andl %edi, %esi
+; X64-LIN-NEXT: shrl %esi
+; X64-LIN-NEXT: movl %esi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test3:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: notl %edx
+; X64-WIN-NEXT: andl %ecx, %edx
+; X64-WIN-NEXT: shrl %edx
+; X64-WIN-NEXT: movl %edx, %eax
+; X64-WIN-NEXT: retq
+entry:
+  %tmp1not = xor i32 %b, -2
+  %tmp3 = and i32 %tmp1not, %a
+  %tmp4 = lshr i32 %tmp3, 1
+  ret i32 %tmp4
 }
 
 define i32 @test4(i32 %a, i32 %b) nounwind {
+; X32-LABEL: test4:
+; X32: # %bb.0: # %entry
+; X32-NEXT: movl {{[0-9]+}}(%esp), %ecx
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: .p2align 4, 0x90
+; X32-NEXT: .LBB3_1: # %bb
+; X32-NEXT: # =>This Inner Loop Header: Depth=1
+; X32-NEXT: xorl %ecx, %eax
+; X32-NEXT: movl %eax, %edx
+; X32-NEXT: notl %edx
+; X32-NEXT: andl %ecx, %edx
+; X32-NEXT: addl %edx, %edx
+; X32-NEXT: movl %edx, %ecx
+; X32-NEXT: jne .LBB3_1
+; X32-NEXT: # %bb.2: # %bb12
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test4:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: .p2align 4, 0x90
+; X64-LIN-NEXT: .LBB3_1: # %bb
+; X64-LIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-LIN-NEXT: xorl %esi, %edi
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: notl %eax
+; X64-LIN-NEXT: andl %esi, %eax
+; X64-LIN-NEXT: addl %eax, %eax
+; X64-LIN-NEXT: movl %eax, %esi
+; X64-LIN-NEXT: jne .LBB3_1
+; X64-LIN-NEXT: # %bb.2: # %bb12
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test4:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: .p2align 4, 0x90
+; X64-WIN-NEXT: .LBB3_1: # %bb
+; X64-WIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-WIN-NEXT: xorl %edx, %ecx
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: notl %eax
+; X64-WIN-NEXT: andl %edx, %eax
+; X64-WIN-NEXT: addl %eax, %eax
+; X64-WIN-NEXT: movl %eax, %edx
+; X64-WIN-NEXT: jne .LBB3_1
+; X64-WIN-NEXT: # %bb.2: # %bb12
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
 entry:
-	br label %bb
+  br label %bb
 bb:
-	%b_addr.0 = phi i32 [ %b, %entry ], [ %tmp8, %bb ]
-	%a_addr.0 = phi i32 [ %a, %entry ], [ %tmp3, %bb ]
-	%tmp3 = xor i32 %a_addr.0, %b_addr.0
-	%tmp4not = xor i32 %tmp3, 2147483647
-	%tmp6 = and i32 %tmp4not, %b_addr.0
-	%tmp8 = shl i32 %tmp6, 1
-	%tmp10 = icmp eq i32 %tmp8, 0
-	br i1 %tmp10, label %bb12, label %bb
+  %b_addr.0 = phi i32 [ %b, %entry ], [ %tmp8, %bb ]
+  %a_addr.0 = phi i32 [ %a, %entry ], [ %tmp3, %bb ]
+  %tmp3 = xor i32 %a_addr.0, %b_addr.0
+  %tmp4not = xor i32 %tmp3, 2147483647
+  %tmp6 = and i32 %tmp4not, %b_addr.0
+  %tmp8 = shl i32 %tmp6, 1
+  %tmp10 = icmp eq i32 %tmp8, 0
+  br i1 %tmp10, label %bb12, label %bb
 bb12:
-	ret i32 %tmp3
-
-; X64-LABEL: test4:
-; X64: notl [[REG:%[a-z]+]]
-; X64: andl {{.*}}[[REG]]
-; X32-LABEL: test4:
-; X32: notl [[REG:%[a-z]+]]
-; X32: andl {{.*}}[[REG]]
+  ret i32 %tmp3
 }
 
 define i16 @test5(i16 %a, i16 %b) nounwind {
+; X32-LABEL: test5:
+; X32: # %bb.0: # %entry
+; X32-NEXT: movzwl {{[0-9]+}}(%esp), %ecx
+; X32-NEXT: movzwl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: .p2align 4, 0x90
+; X32-NEXT: .LBB4_1: # %bb
+; X32-NEXT: # =>This Inner Loop Header: Depth=1
+; X32-NEXT: xorl %ecx, %eax
+; X32-NEXT: movl %eax, %edx
+; X32-NEXT: notl %edx
+; X32-NEXT: andl %ecx, %edx
+; X32-NEXT: addl %edx, %edx
+; X32-NEXT: testw %dx, %dx
+; X32-NEXT: movl %edx, %ecx
+; X32-NEXT: jne .LBB4_1
+; X32-NEXT: # %bb.2: # %bb12
+; X32-NEXT: # kill: def $ax killed $ax killed $eax
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test5:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: .p2align 4, 0x90
+; X64-LIN-NEXT: .LBB4_1: # %bb
+; X64-LIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-LIN-NEXT: xorl %esi, %edi
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: notl %eax
+; X64-LIN-NEXT: andl %esi, %eax
+; X64-LIN-NEXT: addl %eax, %eax
+; X64-LIN-NEXT: testw %ax, %ax
+; X64-LIN-NEXT: movl %eax, %esi
+; X64-LIN-NEXT: jne .LBB4_1
+; X64-LIN-NEXT: # %bb.2: # %bb12
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test5:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: .p2align 4, 0x90
+; X64-WIN-NEXT: .LBB4_1: # %bb
+; X64-WIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-WIN-NEXT: xorl %edx, %ecx
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: notl %eax
+; X64-WIN-NEXT: andl %edx, %eax
+; X64-WIN-NEXT: addl %eax, %eax
+; X64-WIN-NEXT: testw %ax, %ax
+; X64-WIN-NEXT: movl %eax, %edx
+; X64-WIN-NEXT: jne .LBB4_1
+; X64-WIN-NEXT: # %bb.2: # %bb12
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
 entry:
-	br label %bb
+  br label %bb
 bb:
-	%b_addr.0 = phi i16 [ %b, %entry ], [ %tmp8, %bb ]
-	%a_addr.0 = phi i16 [ %a, %entry ], [ %tmp3, %bb ]
-	%tmp3 = xor i16 %a_addr.0, %b_addr.0
-	%tmp4not = xor i16 %tmp3, 32767
-	%tmp6 = and i16 %tmp4not, %b_addr.0
-	%tmp8 = shl i16 %tmp6, 1
-	%tmp10 = icmp eq i16 %tmp8, 0
-	br i1 %tmp10, label %bb12, label %bb
+  %b_addr.0 = phi i16 [ %b, %entry ], [ %tmp8, %bb ]
+  %a_addr.0 = phi i16 [ %a, %entry ], [ %tmp3, %bb ]
+  %tmp3 = xor i16 %a_addr.0, %b_addr.0
+  %tmp4not = xor i16 %tmp3, 32767
+  %tmp6 = and i16 %tmp4not, %b_addr.0
+  %tmp8 = shl i16 %tmp6, 1
+  %tmp10 = icmp eq i16 %tmp8, 0
+  br i1 %tmp10, label %bb12, label %bb
 bb12:
-	ret i16 %tmp3
-; X64-LABEL: test5:
-; X64: notl [[REG:%[a-z]+]]
-; X64: andl {{.*}}[[REG]]
-; X32-LABEL: test5:
-; X32: notl [[REG:%[a-z]+]]
-; X32: andl {{.*}}[[REG]]
+  ret i16 %tmp3
 }
 
 define i8 @test6(i8 %a, i8 %b) nounwind {
+; X32-LABEL: test6:
+; X32: # %bb.0: # %entry
+; X32-NEXT: movb {{[0-9]+}}(%esp), %cl
+; X32-NEXT: movb {{[0-9]+}}(%esp), %al
+; X32-NEXT: .p2align 4, 0x90
+; X32-NEXT: .LBB5_1: # %bb
+; X32-NEXT: # =>This Inner Loop Header: Depth=1
+; X32-NEXT: xorb %cl, %al
+; X32-NEXT: movl %eax, %edx
+; X32-NEXT: notb %dl
+; X32-NEXT: andb %cl, %dl
+; X32-NEXT: addb %dl, %dl
+; X32-NEXT: movl %edx, %ecx
+; X32-NEXT: jne .LBB5_1
+; X32-NEXT: # %bb.2: # %bb12
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test6:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: .p2align 4, 0x90
+; X64-LIN-NEXT: .LBB5_1: # %bb
+; X64-LIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-LIN-NEXT: xorb %sil, %dil
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: notb %al
+; X64-LIN-NEXT: andb %sil, %al
+; X64-LIN-NEXT: addb %al, %al
+; X64-LIN-NEXT: movl %eax, %esi
+; X64-LIN-NEXT: jne .LBB5_1
+; X64-LIN-NEXT: # %bb.2: # %bb12
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test6:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: .p2align 4, 0x90
+; X64-WIN-NEXT: .LBB5_1: # %bb
+; X64-WIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-WIN-NEXT: xorb %dl, %cl
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: notb %al
+; X64-WIN-NEXT: andb %dl, %al
+; X64-WIN-NEXT: addb %al, %al
+; X64-WIN-NEXT: movl %eax, %edx
+; X64-WIN-NEXT: jne .LBB5_1
+; X64-WIN-NEXT: # %bb.2: # %bb12
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
 entry:
-	br label %bb
+  br label %bb
 bb:
-	%b_addr.0 = phi i8 [ %b, %entry ], [ %tmp8, %bb ]
-	%a_addr.0 = phi i8 [ %a, %entry ], [ %tmp3, %bb ]
-	%tmp3 = xor i8 %a_addr.0, %b_addr.0
-	%tmp4not = xor i8 %tmp3, 127
-	%tmp6 = and i8 %tmp4not, %b_addr.0
-	%tmp8 = shl i8 %tmp6, 1
-	%tmp10 = icmp eq i8 %tmp8, 0
-	br i1 %tmp10, label %bb12, label %bb
+  %b_addr.0 = phi i8 [ %b, %entry ], [ %tmp8, %bb ]
+  %a_addr.0 = phi i8 [ %a, %entry ], [ %tmp3, %bb ]
+  %tmp3 = xor i8 %a_addr.0, %b_addr.0
+  %tmp4not = xor i8 %tmp3, 127
+  %tmp6 = and i8 %tmp4not, %b_addr.0
+  %tmp8 = shl i8 %tmp6, 1
+  %tmp10 = icmp eq i8 %tmp8, 0
+  br i1 %tmp10, label %bb12, label %bb
 bb12:
-	ret i8 %tmp3
-; X64-LABEL: test6:
-; X64: notb [[REG:%[a-z]+]]
-; X64: andb {{.*}}[[REG]]
-; X32-LABEL: test6:
-; X32: notb [[REG:%[a-z]+]]
-; X32: andb {{.*}}[[REG]]
+  ret i8 %tmp3
 }
 
 define i32 @test7(i32 %a, i32 %b) nounwind {
+; X32-LABEL: test7:
+; X32: # %bb.0: # %entry
+; X32-NEXT: movl {{[0-9]+}}(%esp), %ecx
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: .p2align 4, 0x90
+; X32-NEXT: .LBB6_1: # %bb
+; X32-NEXT: # =>This Inner Loop Header: Depth=1
+; X32-NEXT: xorl %ecx, %eax
+; X32-NEXT: movl %eax, %edx
+; X32-NEXT: xorl $2147483646, %edx # imm = 0x7FFFFFFE
+; X32-NEXT: andl %ecx, %edx
+; X32-NEXT: addl %edx, %edx
+; X32-NEXT: movl %edx, %ecx
+; X32-NEXT: jne .LBB6_1
+; X32-NEXT: # %bb.2: # %bb12
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test7:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: .p2align 4, 0x90
+; X64-LIN-NEXT: .LBB6_1: # %bb
+; X64-LIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-LIN-NEXT: xorl %esi, %edi
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: xorl $2147483646, %eax # imm = 0x7FFFFFFE
+; X64-LIN-NEXT: andl %esi, %eax
+; X64-LIN-NEXT: addl %eax, %eax
+; X64-LIN-NEXT: movl %eax, %esi
+; X64-LIN-NEXT: jne .LBB6_1
+; X64-LIN-NEXT: # %bb.2: # %bb12
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test7:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: .p2align 4, 0x90
+; X64-WIN-NEXT: .LBB6_1: # %bb
+; X64-WIN-NEXT: # =>This Inner Loop Header: Depth=1
+; X64-WIN-NEXT: xorl %edx, %ecx
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: xorl $2147483646, %eax # imm = 0x7FFFFFFE
+; X64-WIN-NEXT: andl %edx, %eax
+; X64-WIN-NEXT: addl %eax, %eax
+; X64-WIN-NEXT: movl %eax, %edx
+; X64-WIN-NEXT: jne .LBB6_1
+; X64-WIN-NEXT: # %bb.2: # %bb12
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
 entry:
-	br label %bb
+  br label %bb
 bb:
-	%b_addr.0 = phi i32 [ %b, %entry ], [ %tmp8, %bb ]
-	%a_addr.0 = phi i32 [ %a, %entry ], [ %tmp3, %bb ]
-	%tmp3 = xor i32 %a_addr.0, %b_addr.0
-	%tmp4not = xor i32 %tmp3, 2147483646
-	%tmp6 = and i32 %tmp4not, %b_addr.0
-	%tmp8 = shl i32 %tmp6, 1
-	%tmp10 = icmp eq i32 %tmp8, 0
-	br i1 %tmp10, label %bb12, label %bb
+  %b_addr.0 = phi i32 [ %b, %entry ], [ %tmp8, %bb ]
+  %a_addr.0 = phi i32 [ %a, %entry ], [ %tmp3, %bb ]
+  %tmp3 = xor i32 %a_addr.0, %b_addr.0
+  %tmp4not = xor i32 %tmp3, 2147483646
+  %tmp6 = and i32 %tmp4not, %b_addr.0
+  %tmp8 = shl i32 %tmp6, 1
+  %tmp10 = icmp eq i32 %tmp8, 0
+  br i1 %tmp10, label %bb12, label %bb
 bb12:
-	ret i32 %tmp3
-; X64-LABEL: test7:
-; X64: xorl $2147483646, [[REG:%[a-z]+]]
-; X64: andl {{.*}}[[REG]]
-; X32-LABEL: test7:
-; X32: xorl $2147483646, [[REG:%[a-z]+]]
-; X32: andl {{.*}}[[REG]]
+  ret i32 %tmp3
 }
 
-define i32 @test8(i32 %a) nounwind {
 ; rdar://7553032
+define i32 @test8(i32 %a) nounwind {
+; X32-LABEL: test8:
+; X32: # %bb.0: # %entry
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: notl %eax
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test8:
+; X64-LIN: # %bb.0: # %entry
+; X64-LIN-NEXT: notl %edi
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test8:
+; X64-WIN: # %bb.0: # %entry
+; X64-WIN-NEXT: notl %ecx
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
 entry:
   %t1 = sub i32 0, %a
   %t2 = add i32 %t1, -1
   ret i32 %t2
-; X64-LABEL: test8:
-; X64: notl {{%eax|%edi|%ecx}}
-; X32-LABEL: test8:
-; X32: notl %eax
 }
 
 define i32 @test9(i32 %a) nounwind {
+; X32-LABEL: test9:
+; X32: # %bb.0:
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: notl %eax
+; X32-NEXT: andl $4096, %eax # imm = 0x1000
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test9:
+; X64-LIN: # %bb.0:
+; X64-LIN-NEXT: notl %edi
+; X64-LIN-NEXT: andl $4096, %edi # imm = 0x1000
+; X64-LIN-NEXT: movl %edi, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test9:
+; X64-WIN: # %bb.0:
+; X64-WIN-NEXT: notl %ecx
+; X64-WIN-NEXT: andl $4096, %ecx # imm = 0x1000
+; X64-WIN-NEXT: movl %ecx, %eax
+; X64-WIN-NEXT: retq
   %1 = and i32 %a, 4096
   %2 = xor i32 %1, 4096
   ret i32 %2
-; X64-LABEL: test9:
-; X64: notl [[REG:%[a-z]+]]
-; X64: andl {{.*}}[[REG:%[a-z]+]]
-; X32-LABEL: test9:
-; X32: notl [[REG:%[a-z]+]]
-; X32: andl {{.*}}[[REG:%[a-z]+]]
 }
 
 ; PR15948
 define <4 x i32> @test10(<4 x i32> %a) nounwind {
+; X32-LABEL: test10:
+; X32: # %bb.0:
+; X32-NEXT: andnps {{\.LCPI.*}}, %xmm0
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test10:
+; X64-LIN: # %bb.0:
+; X64-LIN-NEXT: andnps {{.*}}(%rip), %xmm0
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test10:
+; X64-WIN: # %bb.0:
+; X64-WIN-NEXT: movaps (%rcx), %xmm0
+; X64-WIN-NEXT: andnps __xmm@{{.*}}(%rip), %xmm0
+; X64-WIN-NEXT: retq
   %1 = and <4 x i32> %a, <i32 4096, i32 4096, i32 4096, i32 4096>
   %2 = xor <4 x i32> %1, <i32 4096, i32 4096, i32 4096, i32 4096>
   ret <4 x i32> %2
-; X64-LABEL: test10:
-; X64: andnps
-; X32-LABEL: test10:
-; X32: andnps
 }
 
 define i32 @PR17487(i1 %tobool) {
+; X32-LABEL: PR17487:
+; X32: # %bb.0:
+; X32-NEXT: movd {{.*#+}} xmm0 = mem[0],zero,zero,zero
+; X32-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
+; X32-NEXT: pandn {{\.LCPI.*}}, %xmm0
+; X32-NEXT: pshufd {{.*#+}} xmm1 = xmm0[3,1,2,3]
+; X32-NEXT: movd %xmm1, %ecx
+; X32-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
+; X32-NEXT: movd %xmm0, %edx
+; X32-NEXT: xorl $1, %edx
+; X32-NEXT: xorl %eax, %eax
+; X32-NEXT: orl %ecx, %edx
+; X32-NEXT: setne %al
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: PR17487:
+; X64-LIN: # %bb.0:
+; X64-LIN-NEXT: movd %edi, %xmm0
+; X64-LIN-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
+; X64-LIN-NEXT: pandn {{.*}}(%rip), %xmm0
+; X64-LIN-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
+; X64-LIN-NEXT: movq %xmm0, %rcx
+; X64-LIN-NEXT: xorl %eax, %eax
+; X64-LIN-NEXT: cmpq $1, %rcx
+; X64-LIN-NEXT: setne %al
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: PR17487:
+; X64-WIN: # %bb.0:
+; X64-WIN-NEXT: movd %ecx, %xmm0
+; X64-WIN-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
+; X64-WIN-NEXT: pandn __xmm@{{.*}}(%rip), %xmm0
+; X64-WIN-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
+; X64-WIN-NEXT: movq %xmm0, %rcx
+; X64-WIN-NEXT: xorl %eax, %eax
+; X64-WIN-NEXT: cmpq $1, %rcx
+; X64-WIN-NEXT: setne %al
+; X64-WIN-NEXT: retq
   %tmp = insertelement <2 x i1> undef, i1 %tobool, i32 1
   %tmp1 = zext <2 x i1> %tmp to <2 x i64>
   %tmp2 = xor <2 x i64> %tmp1, <i64 1, i64 1>
@@ -175,40 +444,65 @@ define i32 @PR17487(i1 %tobool) {
   %cmp6 = icmp ne i64 %add, 1
   %conv7 = zext i1 %cmp6 to i32
   ret i32 %conv7
-
-; X64-LABEL: PR17487:
-; X64: andn
-; X32-LABEL: PR17487:
-; X32: andn
 }
 
 define i32 @test11(i32 %b) {
+; X32-LABEL: test11:
+; X32: # %bb.0:
+; X32-NEXT: movb {{[0-9]+}}(%esp), %cl
+; X32-NEXT: movl $-2, %eax
+; X32-NEXT: roll %cl, %eax
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test11:
+; X64-LIN: # %bb.0:
+; X64-LIN-NEXT: movl $-2, %eax
+; X64-LIN-NEXT: movl %edi, %ecx
+; X64-LIN-NEXT: roll %cl, %eax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test11:
+; X64-WIN: # %bb.0:
+; X64-WIN-NEXT: movl $-2, %eax
+; X64-WIN-NEXT: # kill: def $cl killed $cl killed $ecx
+; X64-WIN-NEXT: roll %cl, %eax
+; X64-WIN-NEXT: retq
   %shl = shl i32 1, %b
   %neg = xor i32 %shl, -1
   ret i32 %neg
-; X64-LABEL: test11:
-; X64: movl $-2, %[[REG:.*]]
-; X64: roll %{{.*}}, %[[REG]]
-; X32-LABEL: test11:
-; X32: movl $-2, %[[REG:.*]]
-; X32: roll %{{.*}}, %[[REG]]
 }
 
 %struct.ref_s = type { %union.v, i16, i16 }
 %union.v = type { i64 }
 
 define %struct.ref_s* @test12(%struct.ref_s* %op, i64 %osbot, i64 %intval) {
+; X32-LABEL: test12:
+; X32: # %bb.0:
+; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: notl %eax
+; X32-NEXT: leal (%eax,%eax,2), %eax
+; X32-NEXT: shll $2, %eax
+; X32-NEXT: addl {{[0-9]+}}(%esp), %eax
+; X32-NEXT: retl
+;
+; X64-LIN-LABEL: test12:
+; X64-LIN: # %bb.0:
+; X64-LIN-NEXT: xorq $-1, %rdx
+; X64-LIN-NEXT: shlq $32, %rdx
+; X64-LIN-NEXT: sarq $28, %rdx
+; X64-LIN-NEXT: leaq (%rdx,%rdi), %rax
+; X64-LIN-NEXT: retq
+;
+; X64-WIN-LABEL: test12:
+; X64-WIN: # %bb.0:
+; X64-WIN-NEXT: xorq $-1, %r8
+; X64-WIN-NEXT: shlq $32, %r8
+; X64-WIN-NEXT: sarq $28, %r8
+; X64-WIN-NEXT: leaq (%r8,%rcx), %rax
+; X64-WIN-NEXT: retq
   %neg = shl i64 %intval, 32
   %sext = xor i64 %neg, -4294967296
   %idx.ext = ashr exact i64 %sext, 32
   %add.ptr = getelementptr inbounds %struct.ref_s, %struct.ref_s* %op, i64 %idx.ext
   ret %struct.ref_s* %add.ptr
-; X64-LABEL: test12:
-; X64: shlq $32, %[[REG:.*]]
-; X64-NOT: not
-; X64: sarq $28, %[[REG]]
-; X32-LABEL: test12:
-; X32: leal
-; X32-NOT: not
-; X32: shll $2, %eax
 }