summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--llvm/lib/Analysis/ScalarEvolution.cpp12
-rw-r--r--llvm/test/Analysis/ScalarEvolution/zext-mul.ll31
2 files changed, 43 insertions, 0 deletions
diff --git a/llvm/lib/Analysis/ScalarEvolution.cpp b/llvm/lib/Analysis/ScalarEvolution.cpp
index dee35392692..08d5eff100f 100644
--- a/llvm/lib/Analysis/ScalarEvolution.cpp
+++ b/llvm/lib/Analysis/ScalarEvolution.cpp
@@ -1778,6 +1778,18 @@ ScalarEvolution::getZeroExtendExpr(const SCEV *Op, Type *Ty, unsigned Depth) {
}
}
+ if (auto *SA = dyn_cast<SCEVMulExpr>(Op)) {
+ // zext((A * B * ...)<nuw>) --> (zext(A) * zext(B) * ...)<nuw>
+ if (SA->hasNoUnsignedWrap()) {
+ // If the multiply does not unsign overflow then we can, by definition,
+ // commute the zero extension with the multiply operation.
+ SmallVector<const SCEV *, 4> Ops;
+ for (const auto *Op : SA->operands())
+ Ops.push_back(getZeroExtendExpr(Op, Ty, Depth + 1));
+ return getMulExpr(Ops, SCEV::FlagNUW, Depth + 1);
+ }
+ }
+
// The cast wasn't folded; create an explicit cast node.
// Recompute the insert position, as it may have been invalidated.
if (const SCEV *S = UniqueSCEVs.FindNodeOrInsertPos(ID, IP)) return S;
diff --git a/llvm/test/Analysis/ScalarEvolution/zext-mul.ll b/llvm/test/Analysis/ScalarEvolution/zext-mul.ll
new file mode 100644
index 00000000000..5206613c8f2
--- /dev/null
+++ b/llvm/test/Analysis/ScalarEvolution/zext-mul.ll
@@ -0,0 +1,31 @@
+; RUN: opt < %s -analyze -scalar-evolution | FileCheck %s
+
+; Check that we convert
+; zext((a * b)<nuw>)
+; to
+; (zext(a) * zext(b))<nuw>
+
+declare i32 @get_int();
+
+; Transform doesn't apply here, because %a lacks range metadata.
+; CHECK-LABEL: @no_range
+define void @no_range() {
+ %a = call i32 @get_int()
+ %b = mul i32 %a, 4
+ %c = zext i32 %b to i64
+ ; CHECK: %c
+ ; CHECK-NEXT: --> (zext i32 (4 * %a) to i64)
+ ret void
+}
+
+; CHECK-LABEL: @range
+define void @range() {
+ %a = call i32 @get_int(), !range !0
+ %b = mul i32 %a, 4
+ %c = zext i32 %b to i64
+ ; CHECK: %c
+ ; CHECK-NEXT: --> (4 * (zext i32 %a to i64))<nuw>
+ ret void
+}
+
+!0 = !{i32 0, i32 100}
OpenPOWER on IntegriCloud