summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorJohannes Doerfert <doerfert@cs.uni-saarland.de>2015-02-27 18:29:04 +0000
committerJohannes Doerfert <doerfert@cs.uni-saarland.de>2015-02-27 18:29:04 +0000
commit514f6efa2bd263d7483c796e9bc119dc84acf724 (patch)
treea1bf6a5aecf81f31bd07cdd5eee579496ceaf458
parent2e3d1e056c8dc2754b932a52a16bb0558f0e5e3d (diff)
downloadbcm5719-llvm-514f6efa2bd263d7483c796e9bc119dc84acf724.tar.gz
bcm5719-llvm-514f6efa2bd263d7483c796e9bc119dc84acf724.zip
[FIX] Teach RegionGenerator to respect and update dominance
When we generate code for a whole region we have to respect dominance and update it too. The first is achieved with multiple "BBMap"s. Each copied block in the region gets its own map. It is initialized only with values mapped in the immediate dominator block, if this block is in the region and was therefor already copied. This way no values defined in a block that doesn't dominate the current one will be used. To update dominance information we check if the immediate dominator of the original block we want to copy is in the region. If so we set the immediate dominator of the current block to the copy of the immediate dominator of the original block. llvm-svn: 230774
-rw-r--r--polly/include/polly/CodeGen/BlockGenerators.h24
-rw-r--r--polly/lib/CodeGen/BlockGenerators.cpp69
-rw-r--r--polly/test/Isl/CodeGen/non-affine-subregion-dominance-reuse.ll74
-rw-r--r--polly/test/Isl/CodeGen/non_affine_float_compare.ll8
4 files changed, 156 insertions, 19 deletions
diff --git a/polly/include/polly/CodeGen/BlockGenerators.h b/polly/include/polly/CodeGen/BlockGenerators.h
index 776105b5d6b..acd0c07c0d6 100644
--- a/polly/include/polly/CodeGen/BlockGenerators.h
+++ b/polly/include/polly/CodeGen/BlockGenerators.h
@@ -100,6 +100,9 @@ protected:
/// @brief The dominator tree of this function.
DominatorTree &DT;
+ /// @brief Split @p BB to create a new one we can use to clone @p BB in.
+ BasicBlock *splitBB(BasicBlock *BB);
+
/// @brief Copy the given basic block.
///
/// @param Stmt The statement to code generate.
@@ -115,6 +118,20 @@ protected:
BasicBlock *copyBB(ScopStmt &Stmt, BasicBlock *BB, ValueMapT &BBMap,
ValueMapT &GlobalMap, LoopToScevMapT &LTS);
+ /// @brief Copy the given basic block.
+ ///
+ /// @param Stmt The statement to code generate.
+ /// @param BB The basic block to code generate.
+ /// @param BBCopy The new basic block to generate code in.
+ /// @param BBMap A mapping from old values to their new values in this
+ /// block.
+ /// @param GlobalMap A mapping from old values to their new values
+ /// (for values recalculated in the new ScoP, but not
+ /// within this basic block).
+ /// @param LTS A map from old loops to new induction variables as SCEVs.
+ void copyBB(ScopStmt &Stmt, BasicBlock *BB, BasicBlock *BBCopy,
+ ValueMapT &BBMap, ValueMapT &GlobalMap, LoopToScevMapT &LTS);
+
/// @brief Get the new version of a value.
///
/// Given an old value, we first check if a new version of this value is
@@ -360,6 +377,13 @@ public:
/// within this basic block).
/// @param LTS A map from old loops to new induction variables as SCEVs.
void copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap, LoopToScevMapT &LTS);
+
+private:
+ /// @brief Repair the dominance tree after we created a copy block for @p BB.
+ ///
+ /// @returns The immediate dominator in the DT for @p BBCopy if in the region.
+ BasicBlock *repairDominance(BasicBlock *BB, BasicBlock *BBCopy,
+ DenseMap<BasicBlock *, BasicBlock *> &BlockMap);
};
}
#endif
diff --git a/polly/lib/CodeGen/BlockGenerators.cpp b/polly/lib/CodeGen/BlockGenerators.cpp
index 26ac56de57c..e1926ef6108 100644
--- a/polly/lib/CodeGen/BlockGenerators.cpp
+++ b/polly/lib/CodeGen/BlockGenerators.cpp
@@ -295,18 +295,27 @@ void BlockGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
copyBB(Stmt, BB, BBMap, GlobalMap, LTS);
}
-BasicBlock *BlockGenerator::copyBB(ScopStmt &Stmt, BasicBlock *BB,
- ValueMapT &BBMap, ValueMapT &GlobalMap,
- LoopToScevMapT &LTS) {
+BasicBlock *BlockGenerator::splitBB(BasicBlock *BB) {
BasicBlock *CopyBB =
SplitBlock(Builder.GetInsertBlock(), Builder.GetInsertPoint(), &DT, &LI);
CopyBB->setName("polly.stmt." + BB->getName());
- Builder.SetInsertPoint(CopyBB->begin());
+ return CopyBB;
+}
+BasicBlock *BlockGenerator::copyBB(ScopStmt &Stmt, BasicBlock *BB,
+ ValueMapT &BBMap, ValueMapT &GlobalMap,
+ LoopToScevMapT &LTS) {
+ BasicBlock *CopyBB = splitBB(BB);
+ copyBB(Stmt, BB, CopyBB, BBMap, GlobalMap, LTS);
+ return CopyBB;
+}
+
+void BlockGenerator::copyBB(ScopStmt &Stmt, BasicBlock *BB, BasicBlock *CopyBB,
+ ValueMapT &BBMap, ValueMapT &GlobalMap,
+ LoopToScevMapT &LTS) {
+ Builder.SetInsertPoint(CopyBB->begin());
for (Instruction &Inst : *BB)
copyInstruction(Stmt, &Inst, BBMap, GlobalMap, LTS);
-
- return CopyBB;
}
VectorBlockGenerator::VectorBlockGenerator(BlockGenerator &BlockGen,
@@ -662,6 +671,19 @@ void VectorBlockGenerator::copyStmt(ScopStmt &Stmt) {
copyInstruction(Stmt, &Inst, VectorBlockMap, ScalarBlockMap);
}
+BasicBlock *RegionGenerator::repairDominance(
+ BasicBlock *BB, BasicBlock *BBCopy,
+ DenseMap<BasicBlock *, BasicBlock *> &BlockMap) {
+
+ BasicBlock *BBIDom = DT.getNode(BB)->getIDom()->getBlock();
+ BasicBlock *BBCopyIDom = BlockMap.lookup(BBIDom);
+
+ if (BBCopyIDom)
+ DT.changeImmediateDominator(BBCopy, BBCopyIDom);
+
+ return BBCopyIDom;
+}
+
void RegionGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
LoopToScevMapT &LTS) {
assert(Stmt.isRegionStmt() &&
@@ -670,8 +692,11 @@ void RegionGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
// The region represented by the statement.
Region *R = Stmt.getRegion();
- // The "BBMap" for the whole region.
- ValueMapT RegionMap;
+ // The "BBMaps" for the whole region.
+ DenseMap<BasicBlock *, ValueMapT> RegionMaps;
+
+ // A map from old to new blocks in the region
+ DenseMap<BasicBlock *, BasicBlock *> BlockMap;
// Iterate over all blocks in the region in a breadth-first search.
std::deque<BasicBlock *> Blocks;
@@ -683,8 +708,17 @@ void RegionGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
BasicBlock *BB = Blocks.front();
Blocks.pop_front();
+ // First split the block and update dominance information.
+ BasicBlock *BBCopy = splitBB(BB);
+ BasicBlock *BBCopyIDom = repairDominance(BB, BBCopy, BlockMap);
+
+ // Get the mapping for this block and initialize it with the mapping
+ // available at its immediate dominator (in the new region).
+ ValueMapT &RegionMap = RegionMaps[BBCopy];
+ RegionMap = RegionMaps[BBCopyIDom];
+
// Copy the block with the BlockGenerator.
- BasicBlock *BBCopy = copyBB(Stmt, BB, RegionMap, GlobalMap, LTS);
+ copyBB(Stmt, BB, BBCopy, RegionMap, GlobalMap, LTS);
// And continue with new successors inside the region.
for (auto SI = succ_begin(BB), SE = succ_end(BB); SI != SE; SI++)
@@ -692,14 +726,16 @@ void RegionGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
Blocks.push_back(*SI);
// In order to remap PHI nodes we store also basic block mappings.
- RegionMap[BB] = BBCopy;
+ BlockMap[BB] = BBCopy;
}
// Now create a new dedicated region exit block and add it to the region map.
- BasicBlock *RegionExit =
+ BasicBlock *ExitBBCopy =
SplitBlock(Builder.GetInsertBlock(), Builder.GetInsertPoint(), &DT, &LI);
- RegionExit->setName("polly.stmt." + R->getExit()->getName() + ".pre");
- RegionMap[R->getExit()] = RegionExit;
+ ExitBBCopy->setName("polly.stmt." + R->getExit()->getName() + ".as.exit");
+ BlockMap[R->getExit()] = ExitBBCopy;
+
+ repairDominance(R->getExit(), ExitBBCopy, BlockMap);
// As the block generator doesn't handle control flow we need to add the
// region control flow by hand after all blocks have been copied.
@@ -707,14 +743,17 @@ void RegionGenerator::copyStmt(ScopStmt &Stmt, ValueMapT &GlobalMap,
BranchInst *BI = cast<BranchInst>(BB->getTerminator());
- BasicBlock *BBCopy = cast<BasicBlock>(RegionMap[BB]);
+ BasicBlock *BBCopy = BlockMap[BB];
Instruction *BICopy = BBCopy->getTerminator();
+ ValueMapT &RegionMap = RegionMaps[BBCopy];
+ RegionMap.insert(BlockMap.begin(), BlockMap.end());
+
Builder.SetInsertPoint(BBCopy);
copyInstScalar(Stmt, BI, RegionMap, GlobalMap, LTS);
BICopy->eraseFromParent();
}
// Reset the old insert point for the build.
- Builder.SetInsertPoint(RegionExit->begin());
+ Builder.SetInsertPoint(ExitBBCopy->begin());
}
diff --git a/polly/test/Isl/CodeGen/non-affine-subregion-dominance-reuse.ll b/polly/test/Isl/CodeGen/non-affine-subregion-dominance-reuse.ll
new file mode 100644
index 00000000000..ac1539843a3
--- /dev/null
+++ b/polly/test/Isl/CodeGen/non-affine-subregion-dominance-reuse.ll
@@ -0,0 +1,74 @@
+; RUN: opt %loadPolly -polly-codegen-isl -S -verify-dom-info < %s | FileCheck %s
+;
+; Check that we do not reuse the B[i-1] GEP created in block S again in
+; block Q. Hence, we create two GEPs for B[i-1]:
+;
+; CHECK: %scevgep{{.}} = getelementptr i32* %B, i64 -1
+; CHECK: %scevgep{{.}} = getelementptr i32* %B, i64 -1
+;
+; void f(int *A, int *B) {
+; int x = 0;
+; for (int i = 0; i < 1024; i++) {
+; if (A[i]) {
+; if (i > 512)
+; S: A[i] = B[i - 1];
+; Q: A[i] += B[i - 1];
+; }
+; }
+; }
+;
+target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
+
+define void @f(i32* %A, i32* %B) {
+bb:
+ br label %bb1
+
+bb1: ; preds = %bb22, %bb
+ %indvars.iv = phi i64 [ %indvars.iv.next, %bb22 ], [ 0, %bb ]
+ %exitcond = icmp ne i64 %indvars.iv, 1024
+ br i1 %exitcond, label %bb2, label %bb23
+
+bb2: ; preds = %bb1
+ %tmp = getelementptr inbounds i32* %A, i64 %indvars.iv
+ %tmp3 = load i32* %tmp, align 4
+ %tmp4 = icmp eq i32 %tmp3, 0
+ br i1 %tmp4, label %bb21, label %bb5
+
+bb5: ; preds = %bb2
+ %tmp6 = icmp sgt i64 %indvars.iv, 512
+ br i1 %tmp6, label %bb7, label %bb13
+
+bb7: ; preds = %bb5
+ br label %bb8
+
+bb8: ; preds = %bb7
+ %tmp9 = add nsw i64 %indvars.iv, -1
+ %tmp10 = getelementptr inbounds i32* %B, i64 %tmp9
+ %tmp11 = load i32* %tmp10, align 4
+ %tmp12 = getelementptr inbounds i32* %A, i64 %indvars.iv
+ store i32 %tmp11, i32* %tmp12, align 4
+ br label %bb13
+
+bb13: ; preds = %bb8, %bb5
+ br label %bb14
+
+bb14: ; preds = %bb13
+ %tmp15 = add nsw i64 %indvars.iv, -1
+ %tmp16 = getelementptr inbounds i32* %B, i64 %tmp15
+ %tmp17 = load i32* %tmp16, align 4
+ %tmp18 = getelementptr inbounds i32* %A, i64 %indvars.iv
+ %tmp19 = load i32* %tmp18, align 4
+ %tmp20 = add nsw i32 %tmp19, %tmp17
+ store i32 %tmp20, i32* %tmp18, align 4
+ br label %bb21
+
+bb21: ; preds = %bb2, %bb14
+ br label %bb22
+
+bb22: ; preds = %bb21
+ %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
+ br label %bb1
+
+bb23: ; preds = %bb1
+ ret void
+}
diff --git a/polly/test/Isl/CodeGen/non_affine_float_compare.ll b/polly/test/Isl/CodeGen/non_affine_float_compare.ll
index 2b829d29e4b..7f5d9480316 100644
--- a/polly/test/Isl/CodeGen/non_affine_float_compare.ll
+++ b/polly/test/Isl/CodeGen/non_affine_float_compare.ll
@@ -1,4 +1,4 @@
-; RUN: opt %loadPolly -polly-codegen-isl -polly-no-early-exit -polly-allow-nonaffine-branches -S < %s | FileCheck %s
+; RUN: opt %loadPolly -polly-codegen-isl -polly-no-early-exit -polly-allow-nonaffine-branches -S -verify-dom-info < %s | FileCheck %s
;
; void f(float *A) {
; for (int i = 0; i < 1024; i++)
@@ -14,16 +14,16 @@
; CHECK: %scevgep[[R2:[0-9]*]] = getelementptr float* %scevgep{{[0-9]*}}, i64 %polly.indvar
; CHECK: %tmp6_p_scalar_ = load float* %scevgep[[R2]], align 4, !alias.scope !0, !noalias !2
; CHECK: %p_tmp7 = fcmp oeq float %tmp3_p_scalar_, %tmp6_p_scalar_
-; CHECK: br i1 %p_tmp7, label %polly.stmt.bb8, label %polly.stmt.bb12.pre
+; CHECK: br i1 %p_tmp7, label %polly.stmt.bb8, label %polly.stmt.bb12.[[R:[a-zA-Z_.0-9]*]]
; CHECK: polly.stmt.bb8:
; CHECK: %scevgep[[R3:[0-9]*]] = getelementptr float* %A, i64 %polly.indvar
; CHECK: %tmp10_p_scalar_ = load float* %scevgep[[R3]], align 4, !alias.scope !0, !noalias !2
; CHECK: %p_tmp11 = fadd float %tmp10_p_scalar_, 1.000000e+00
; CHECK: store float %p_tmp11, float* %scevgep[[R3]], align 4, !alias.scope !0, !noalias !2
-; CHECK: br label %polly.stmt.bb12.pre
+; CHECK: br label %polly.stmt.bb12.[[R]]
-; CHECK: polly.stmt.bb12.pre:
+; CHECK: polly.stmt.bb12.[[R]]:
; CHECK: br label %polly.stmt.bb12
; CHECK: polly.stmt.bb12:
OpenPOWER on IntegriCloud