diff options
| -rw-r--r-- | llvm/lib/Analysis/ScalarEvolution.cpp | 12 | ||||
| -rw-r--r-- | llvm/test/Analysis/ScalarEvolution/zext-mul.ll | 31 |
2 files changed, 43 insertions, 0 deletions
diff --git a/llvm/lib/Analysis/ScalarEvolution.cpp b/llvm/lib/Analysis/ScalarEvolution.cpp index dee35392692..08d5eff100f 100644 --- a/llvm/lib/Analysis/ScalarEvolution.cpp +++ b/llvm/lib/Analysis/ScalarEvolution.cpp @@ -1778,6 +1778,18 @@ ScalarEvolution::getZeroExtendExpr(const SCEV *Op, Type *Ty, unsigned Depth) { } } + if (auto *SA = dyn_cast<SCEVMulExpr>(Op)) { + // zext((A * B * ...)<nuw>) --> (zext(A) * zext(B) * ...)<nuw> + if (SA->hasNoUnsignedWrap()) { + // If the multiply does not unsign overflow then we can, by definition, + // commute the zero extension with the multiply operation. + SmallVector<const SCEV *, 4> Ops; + for (const auto *Op : SA->operands()) + Ops.push_back(getZeroExtendExpr(Op, Ty, Depth + 1)); + return getMulExpr(Ops, SCEV::FlagNUW, Depth + 1); + } + } + // The cast wasn't folded; create an explicit cast node. // Recompute the insert position, as it may have been invalidated. if (const SCEV *S = UniqueSCEVs.FindNodeOrInsertPos(ID, IP)) return S; diff --git a/llvm/test/Analysis/ScalarEvolution/zext-mul.ll b/llvm/test/Analysis/ScalarEvolution/zext-mul.ll new file mode 100644 index 00000000000..5206613c8f2 --- /dev/null +++ b/llvm/test/Analysis/ScalarEvolution/zext-mul.ll @@ -0,0 +1,31 @@ +; RUN: opt < %s -analyze -scalar-evolution | FileCheck %s + +; Check that we convert +; zext((a * b)<nuw>) +; to +; (zext(a) * zext(b))<nuw> + +declare i32 @get_int(); + +; Transform doesn't apply here, because %a lacks range metadata. +; CHECK-LABEL: @no_range +define void @no_range() { + %a = call i32 @get_int() + %b = mul i32 %a, 4 + %c = zext i32 %b to i64 + ; CHECK: %c + ; CHECK-NEXT: --> (zext i32 (4 * %a) to i64) + ret void +} + +; CHECK-LABEL: @range +define void @range() { + %a = call i32 @get_int(), !range !0 + %b = mul i32 %a, 4 + %c = zext i32 %b to i64 + ; CHECK: %c + ; CHECK-NEXT: --> (4 * (zext i32 %a to i64))<nuw> + ret void +} + +!0 = !{i32 0, i32 100} |

