diff options
author | Sanjoy Das <sanjoy@playingwithpointers.com> | 2016-07-14 19:21:15 +0000 |
---|---|---|
committer | Sanjoy Das <sanjoy@playingwithpointers.com> | 2016-07-14 19:21:15 +0000 |
commit | 13623ad009ba13f7179900a7cfd5370eb85f692f (patch) | |
tree | 5c1203ee7549dde3c777ef67b3ee46fd5d5899b9 | |
parent | 31ceba7c447d21661650bb4f44a21f9da574add2 (diff) | |
download | bcm5719-llvm-13623ad009ba13f7179900a7cfd5370eb85f692f.tar.gz bcm5719-llvm-13623ad009ba13f7179900a7cfd5370eb85f692f.zip |
[JumpThreading] PRE unordered loads
Summary: Extend JumpThreading's PRE to unordered atomic loads.
Reviewers: hfinkel, reames
Subscribers: mcrosier, llvm-commits
Differential Revision: http://reviews.llvm.org/D22326
llvm-svn: 275456
-rw-r--r-- | llvm/lib/Transforms/Scalar/JumpThreading.cpp | 11 | ||||
-rw-r--r-- | llvm/test/Transforms/JumpThreading/thread-loads.ll | 139 |
2 files changed, 145 insertions, 5 deletions
diff --git a/llvm/lib/Transforms/Scalar/JumpThreading.cpp b/llvm/lib/Transforms/Scalar/JumpThreading.cpp index de1d7d50384..b9e717cf763 100644 --- a/llvm/lib/Transforms/Scalar/JumpThreading.cpp +++ b/llvm/lib/Transforms/Scalar/JumpThreading.cpp @@ -924,8 +924,8 @@ bool JumpThreadingPass::ProcessImpliedCondition(BasicBlock *BB) { /// important optimization that encourages jump threading, and needs to be run /// interlaced with other jump threading tasks. bool JumpThreadingPass::SimplifyPartiallyRedundantLoad(LoadInst *LI) { - // Don't hack volatile/atomic loads. - if (!LI->isSimple()) return false; + // Don't hack volatile and ordered loads. + if (!LI->isUnordered()) return false; // If the load is defined in a block with exactly one predecessor, it can't be // partially redundant. @@ -1055,9 +1055,10 @@ bool JumpThreadingPass::SimplifyPartiallyRedundantLoad(LoadInst *LI) { if (UnavailablePred) { assert(UnavailablePred->getTerminator()->getNumSuccessors() == 1 && "Can't handle critical edge here!"); - LoadInst *NewVal = new LoadInst(LoadedPtr, LI->getName()+".pr", false, - LI->getAlignment(), - UnavailablePred->getTerminator()); + LoadInst *NewVal = + new LoadInst(LoadedPtr, LI->getName() + ".pr", false, + LI->getAlignment(), LI->getOrdering(), LI->getSynchScope(), + UnavailablePred->getTerminator()); NewVal->setDebugLoc(LI->getDebugLoc()); if (AATags) NewVal->setAAMetadata(AATags); diff --git a/llvm/test/Transforms/JumpThreading/thread-loads.ll b/llvm/test/Transforms/JumpThreading/thread-loads.ll index 0981e1940dc..4b482cb15f9 100644 --- a/llvm/test/Transforms/JumpThreading/thread-loads.ll +++ b/llvm/test/Transforms/JumpThreading/thread-loads.ll @@ -107,6 +107,145 @@ return: ret i32 13 } +define i32 @test4(i32* %P) { +; CHECK-LABEL: @test4( +entry: + %v0 = tail call i32 (...) @f1() + %v1 = icmp eq i32 %v0, 0 + br i1 %v1, label %bb1, label %bb + +bb: +; CHECK: bb1.thread: +; CHECK: store atomic +; CHECK: br label %bb3 + store atomic i32 42, i32* %P unordered, align 4 + br label %bb1 + +bb1: +; CHECK: bb1: +; CHECK-NOT: phi +; CHECK: load atomic + %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] + %v2 = load atomic i32, i32* %P unordered, align 4 + %v3 = icmp sgt i32 %v2, 36 + br i1 %v3, label %bb3, label %bb2 + +bb2: + %v4 = tail call i32 (...) @f2() + ret i32 %res.0 + +bb3: + ret i32 %res.0 +} + +define i32 @test5(i32* %P) { +; Negative test + +; CHECK-LABEL: @test5( +entry: + %v0 = tail call i32 (...) @f1() + %v1 = icmp eq i32 %v0, 0 + br i1 %v1, label %bb1, label %bb + +bb: +; CHECK: bb: +; CHECK-NEXT: store atomic i32 42, i32* %P release, align 4 +; CHECK-NEXT: br label %bb1 + store atomic i32 42, i32* %P release, align 4 + br label %bb1 + +bb1: +; CHECK: bb1: +; CHECK-NEXT: %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] +; CHECK-NEXT: %v2 = load atomic i32, i32* %P acquire, align 4 +; CHECK-NEXT: %v3 = icmp sgt i32 %v2, 36 +; CHECK-NEXT: br i1 %v3, label %bb3, label %bb2 + + %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] + %v2 = load atomic i32, i32* %P acquire, align 4 + %v3 = icmp sgt i32 %v2, 36 + br i1 %v3, label %bb3, label %bb2 + +bb2: + %v4 = tail call i32 (...) @f2() + ret i32 %res.0 + +bb3: + ret i32 %res.0 +} + +define i32 @test6(i32* %P) { +; Negative test + +; CHECK-LABEL: @test6( +entry: + %v0 = tail call i32 (...) @f1() + %v1 = icmp eq i32 %v0, 0 + br i1 %v1, label %bb1, label %bb + +bb: +; CHECK: bb: +; CHECK-NEXT: store i32 42, i32* %P +; CHECK-NEXT: br label %bb1 + store i32 42, i32* %P + br label %bb1 + +bb1: +; CHECK: bb1: +; CHECK-NEXT: %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] +; CHECK-NEXT: %v2 = load atomic i32, i32* %P acquire, align 4 +; CHECK-NEXT: %v3 = icmp sgt i32 %v2, 36 +; CHECK-NEXT: br i1 %v3, label %bb3, label %bb2 + + %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] + %v2 = load atomic i32, i32* %P acquire, align 4 + %v3 = icmp sgt i32 %v2, 36 + br i1 %v3, label %bb3, label %bb2 + +bb2: + %v4 = tail call i32 (...) @f2() + ret i32 %res.0 + +bb3: + ret i32 %res.0 +} + +define i32 @test7(i32* %P) { +; Negative test + +; CHECK-LABEL: @test7( +entry: + %v0 = tail call i32 (...) @f1() + %v1 = icmp eq i32 %v0, 0 + br i1 %v1, label %bb1, label %bb + +bb: +; CHECK: bb: +; CHECK-NEXT: %val = load i32, i32* %P +; CHECK-NEXT: br label %bb1 + %val = load i32, i32* %P + br label %bb1 + +bb1: +; CHECK: bb1: +; CHECK-NEXT: %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] +; CHECK-NEXT: %v2 = load atomic i32, i32* %P acquire, align 4 +; CHECK-NEXT: %v3 = icmp sgt i32 %v2, 36 +; CHECK-NEXT: br i1 %v3, label %bb3, label %bb2 + + %res.0 = phi i32 [ 1, %bb ], [ 0, %entry ] + %v2 = load atomic i32, i32* %P acquire, align 4 + %v3 = icmp sgt i32 %v2, 36 + br i1 %v3, label %bb3, label %bb2 + +bb2: + %v4 = tail call i32 (...) @f2() + ret i32 %res.0 + +bb3: + ret i32 %res.0 +} + !0 = !{!3, !3, i64 0} !1 = !{!"omnipotent char", !2} !2 = !{!"Simple C/C++ TBAA", null} |