[InstCombine] move add after umin/umax

In the motivating cases from PR14613: https://bugs.llvm.org/show_bug.cgi?id=14613 ...moving the add enables us to narrow the min/max which eliminates zext/trunc which enables signficantly better vectorization. But that bug is still not completely fixed. https://rise4fun.com/Alive/5KQ Name: umax Pre: C1 u>= C0 %a = add nuw i8 %x, C0 %cond = icmp ugt i8 %a, C1 %r = select i1 %cond, i8 %a, i8 C1 => %c2 = icmp ugt i8 %x, C1-C0 %u2 = select i1 %c2, i8 %x, i8 C1-C0 %r = add nuw i8 %u2, C0 Name: umin Pre: C1 u>= C0 %a = add nuw i32 %x, C0 %cond = icmp ult i32 %a, C1 %r = select i1 %cond, i32 %a, i32 C1 => %c2 = icmp ult i32 %x, C1-C0 %u2 = select i1 %c2, i32 %x, i32 C1-C0 %r = add nuw i32 %u2, C0 llvm-svn: 355221
author: Sanjay Patel <spatel@rotateright.com> 2019-03-01 19:42:40 +0000
committer: Sanjay Patel <spatel@rotateright.com> 2019-03-01 19:42:40 +0000
commit: 6e1e7e1c3ecc66db573ebd85c5d9570e0665b248 (patch)
tree: ed2148503bb488a1b068f151f1673da4c18fadd0 /llvm/lib/Transforms
parent: 20292a0526869b45e72f58bec272dd9b68f4aa4a (diff)
download: bcm5719-llvm-6e1e7e1c3ecc66db573ebd85c5d9570e0665b248.tar.gz
bcm5719-llvm-6e1e7e1c3ecc66db573ebd85c5d9570e0665b248.zip
1 files changed, 27 insertions, 0 deletions
diff --git a/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp b/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp
index 79835ef9316..b39a4648579 100644
--- a/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp
+++ b/llvm/lib/Transforms/InstCombine/InstCombineSelect.cpp
@@ -1563,6 +1563,30 @@ static Instruction *foldSelectCmpXchg(SelectInst &SI) {
   return nullptr;
 }
 
+static Instruction *moveAddAfterMinMax(SelectPatternFlavor SPF, Value *X,
+                                       Value *Y,
+                                       InstCombiner::BuilderTy &Builder) {
+  assert (SelectPatternResult::isMinOrMax(SPF) && "Expected min/max pattern");
+  bool IsUnsigned = SPF == SelectPatternFlavor::SPF_UMIN ||
+                    SPF == SelectPatternFlavor::SPF_UMAX;
+  // TODO: If InstSimplify could fold all cases where C2 <= C1, we could change
+  // the constant value check to an assert.
+  Value *A;
+  const APInt *C1, *C2;
+  if (IsUnsigned && match(X, m_NUWAdd(m_Value(A), m_APInt(C1))) &&
+      match(Y, m_APInt(C2)) && C2->uge(*C1) && X->hasNUses(2)) {
+    // umin (add nuw A, C1), C2 --> add nuw (umin A, C2 - C1), C1
+    // umax (add nuw A, C1), C2 --> add nuw (umax A, C2 - C1), C1
+    Value *NewMinMax = createMinMax(Builder, SPF, A,
+                                    ConstantInt::get(X->getType(), *C2 - *C1));
+    return BinaryOperator::CreateNUW(BinaryOperator::Add, NewMinMax,
+                                     ConstantInt::get(X->getType(), *C1));
+  }
+  // TODO: Handle SMIN/SMAX (similar to unsigned, but the signed subtraction of
+  // the constants must not overflow).
+  return nullptr;
+}
+
 /// Reduce a sequence of min/max with a common operand.
 static Instruction *factorizeMinMaxTree(SelectPatternFlavor SPF, Value *LHS,
                                         Value *RHS,
@@ -1962,6 +1986,9 @@ Instruction *InstCombiner::visitSelectInst(SelectInst &SI) {
       if (Instruction *I = moveNotAfterMinMax(RHS, LHS))
         return I;
 
+      if (Instruction *I = moveAddAfterMinMax(SPF, LHS, RHS, Builder))
+        return I;
+
       if (Instruction *I = factorizeMinMaxTree(SPF, LHS, RHS, Builder))
         return I;
     }
author	Sanjay Patel <spatel@rotateright.com>	2019-03-01 19:42:40 +0000
committer	Sanjay Patel <spatel@rotateright.com>	2019-03-01 19:42:40 +0000
commit	6e1e7e1c3ecc66db573ebd85c5d9570e0665b248 (patch)
tree	ed2148503bb488a1b068f151f1673da4c18fadd0 /llvm/lib/Transforms
parent	20292a0526869b45e72f58bec272dd9b68f4aa4a (diff)
download	bcm5719-llvm-6e1e7e1c3ecc66db573ebd85c5d9570e0665b248.tar.gz bcm5719-llvm-6e1e7e1c3ecc66db573ebd85c5d9570e0665b248.zip