| author | Craig Topper <craig.topper@intel.com> | 2018-02-23 00:21:39 +0000 |
|---|---|---|
| committer | Craig Topper <craig.topper@intel.com> | 2018-02-23 00:21:39 +0000 |
| commit | 0dcc88a500e120f50716e6d3efc2a9cf5db6d570 (patch) | |
| tree | 50fc0dce662763e9f233d2b5198db23e9c7c3bfc /llvm/test | |
| parent | 5c986b010b118ccd6dcb0a0eba5579d961e1ec67 (diff) | |
[X86] Turn setne X, signedmax into setgt signedmax, X in LowerVSETCC to avoid an invert
We won't be able to fold the constant pool load, but it's still better than materializing all-ones and XORing for the invert if we used PCMPEQ.
This will fix another regression from D42948.
llvm-svn: 325845
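
For reference, the rewrite is sound because no signed 32-bit value is greater than the signed maximum, so `X != SMAX` and `SMAX > X` agree on every input. Below is a minimal standalone C++ sketch (not the actual LowerVSETCC code; the sample values are chosen here purely for illustration) that spot-checks the equivalence:

```cpp
// Standalone illustration (not the LLVM LowerVSETCC code): checks that
// "setne X, signedmax" and "setgt signedmax, X" compute the same predicate.
// Nothing is greater than the signed maximum, so the only case where the two
// could differ, X == SMAX, makes both comparisons false.
#include <cassert>
#include <cstdint>
#include <limits>

int main() {
  const int32_t SMax = std::numeric_limits<int32_t>::max(); // 2147483647

  // Spot-check the boundary values; the sample set is arbitrary.
  const int32_t Samples[] = {std::numeric_limits<int32_t>::min(), -1, 0, 1,
                             SMax - 1, SMax};
  for (int32_t X : Samples) {
    bool SetNE = (X != SMax); // what the IR asks for (icmp ne)
    bool SetGT = (SMax > X);  // what the lowering emits instead (PCMPGTD)
    assert(SetNE == SetGT);
  }
  return 0;
}
```

The payoff, per the commit message, is that PCMPGTD produces the desired mask directly, whereas PCMPEQD would produce the inverted mask and require materializing an all-ones vector plus a PXOR to flip it.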
Diffstat (limited to 'llvm/test')
| -rw-r--r-- | llvm/test/CodeGen/X86/vector-compare-simplify.ll | 15 |
1 file changed, 15 insertions, 0 deletions
```diff
diff --git a/llvm/test/CodeGen/X86/vector-compare-simplify.ll b/llvm/test/CodeGen/X86/vector-compare-simplify.ll
index f1ac60134eb..e7f1d849b2f 100644
--- a/llvm/test/CodeGen/X86/vector-compare-simplify.ll
+++ b/llvm/test/CodeGen/X86/vector-compare-simplify.ll
@@ -345,3 +345,18 @@ define <4 x i32> @ne_smin(<4 x i32> %x) {
   ret <4 x i32> %r
 }
+; Make sure we can efficiently handle ne smax by turning into sgt. We can't fold
+; the constant pool load, but the alternative is a cmpeq+invert which is 3 instructions.
+; The PCMPGT version is two instructions given sufficient register allocation freedom
+; to avoid the last mov to %xmm0 seen here.
+define <4 x i32> @ne_smax(<4 x i32> %x) {
+; CHECK-LABEL: ne_smax:
+; CHECK: # %bb.0:
+; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [2147483647,2147483647,2147483647,2147483647]
+; CHECK-NEXT: pcmpgtd %xmm0, %xmm1
+; CHECK-NEXT: movdqa %xmm1, %xmm0
+; CHECK-NEXT: retq
+  %cmp = icmp ne <4 x i32> %x, <i32 2147483647, i32 2147483647, i32 2147483647, i32 2147483647>
+  %r = sext <4 x i1> %cmp to <4 x i32>
+  ret <4 x i32> %r
+}
```

