summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Jonas Paulsson <paulsson@linux.vnet.ibm.com> 2017-04-12 13:29:25 +0000
committer: Jonas Paulsson <paulsson@linux.vnet.ibm.com> 2017-04-12 13:29:25 +0000
commit: 22776892c9aad3cedd2f3692d324ff45af1b29fb (patch)
tree: a4613b602bdf1b5b5c21bc1176a3dfb17b61dd92
parent: 33580692f61e8c0cb540604f6b55abb7bd78df5f (diff)
download: bcm5719-llvm-22776892c9aad3cedd2f3692d324ff45af1b29fb.tar.gz
download: bcm5719-llvm-22776892c9aad3cedd2f3692d324ff45af1b29fb.zip
[SLPVectorizer] Pass the right type argument to getCmpSelInstrCost()

In getEntryCost(), make the scalar type for a compare instruction that of the
operands, not i1. This is needed in order to call getCmpSelInstrCost() for a
compare in a sensible way, the same way as the LoopVectorizer does.

New test: test/Transforms/SLPVectorizer/SystemZ/SLP-cmp-cost-query.ll

Review: Matthew Simpson
https://reviews.llvm.org/D31601

llvm-svn: 300061

-rw-r--r--  llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp                   |  2
-rw-r--r--  llvm/test/Transforms/SLPVectorizer/SystemZ/SLP-cmp-cost-query.ll  | 36
2 files changed, 38 insertions, 0 deletions
diff --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
index df7dc2ac67f..da3ac06ab46 100644
--- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
+++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp
@@ -1702,6 +1702,8 @@ int BoUpSLP::getEntryCost(TreeEntry *E) {
Type *ScalarTy = VL[0]->getType();
if (StoreInst *SI = dyn_cast<StoreInst>(VL[0]))
ScalarTy = SI->getValueOperand()->getType();
+ else if (CmpInst *CI = dyn_cast<CmpInst>(VL[0]))
+ ScalarTy = CI->getOperand(0)->getType();
VectorType *VecTy = VectorType::get(ScalarTy, VL.size());
// If we have computed a smaller type for the expression, update VecTy so
diff --git a/llvm/test/Transforms/SLPVectorizer/SystemZ/SLP-cmp-cost-query.ll b/llvm/test/Transforms/SLPVectorizer/SystemZ/SLP-cmp-cost-query.ll
new file mode 100644
index 00000000000..535003ae6f0
--- /dev/null
+++ b/llvm/test/Transforms/SLPVectorizer/SystemZ/SLP-cmp-cost-query.ll
@@ -0,0 +1,36 @@
+; REQUIRES: asserts
+; RUN: opt -mtriple=systemz-unknown -mcpu=z13 -slp-vectorizer -debug-only=SLP \
+; RUN: -S -disable-output < %s |& FileCheck %s
+;
+; Check that SLP vectorizer gets the right cost difference for a compare
+; node.
+
+; Function Attrs: norecurse nounwind readonly
+define void @fun(i8* nocapture, i32 zeroext) local_unnamed_addr #0 {
+.lr.ph.preheader:
+ br label %.lr.ph
+
+.lr.ph: ; preds = %.lr.ph.preheader, %.lr.ph
+ %2 = phi i32 [ %., %.lr.ph ], [ undef, %.lr.ph.preheader ]
+ %3 = phi i32 [ %.9, %.lr.ph ], [ undef, %.lr.ph.preheader ]
+ %4 = icmp ult i32 %2, %1
+ %5 = select i1 %4, i32 0, i32 %1
+ %. = sub i32 %2, %5
+ %6 = icmp ult i32 %3, %1
+ %7 = select i1 %6, i32 0, i32 %1
+ %.9 = sub i32 %3, %7
+ %8 = zext i32 %. to i64
+ %9 = getelementptr inbounds i8, i8* %0, i64 %8
+ %10 = load i8, i8* %9, align 1
+ %11 = zext i32 %.9 to i64
+ %12 = getelementptr inbounds i8, i8* %0, i64 %11
+ %13 = load i8, i8* %12, align 1
+ %14 = icmp eq i8 %10, %13
+ br i1 %14, label %.lr.ph, label %._crit_edge
+
+._crit_edge: ; preds = %.lr.ph
+ ret void
+
+; CHECK: SLP: Adding cost -1 for bundle that starts with %4 = icmp ult i32 %2, %1.
+}
+
OpenPOWER on IntegriCloud