diff options
| author | Chad Rosier <mcrosier@codeaurora.org> | 2014-11-14 21:09:13 +0000 | 
|---|---|---|
| committer | Chad Rosier <mcrosier@codeaurora.org> | 2014-11-14 21:09:13 +0000 | 
| commit | 1ff4c0bf0ba21869e4f7a43843fac11b1244ecf2 (patch) | |
| tree | b88bf82d81ab367e8d16a8aae446b5efc8dd66b0 /llvm/lib/Transforms/Scalar/GVN.cpp | |
| parent | 1876784bb1020c493a28158ce01cd4caf771c823 (diff) | |
| download | bcm5719-llvm-1ff4c0bf0ba21869e4f7a43843fac11b1244ecf2.tar.gz bcm5719-llvm-1ff4c0bf0ba21869e4f7a43843fac11b1244ecf2.zip | |
Reapply r221924: "[GVN] Perform Scalar PRE on gep indices that feed loads before
doing Load PRE"
This commit updates the failing test in
Analysis/TypeBasedAliasAnalysis/gvn-nonlocal-type-mismatch.ll
The failing test is sensitive to the order in which we process loads.  This
version turns on the RPO traversal instead of the depth-first DT traversal in GVN.
The new test code is functionally the same; only the order in which the loads
are eliminated is swapped.
This new version also fixes an issue where GVN splits a critical edge and
potentially invalidates the RPO/DT iterator.
llvm-svn: 222039
Diffstat (limited to 'llvm/lib/Transforms/Scalar/GVN.cpp')
| -rw-r--r-- | llvm/lib/Transforms/Scalar/GVN.cpp | 336 | 
1 files changed, 175 insertions, 161 deletions
| diff --git a/llvm/lib/Transforms/Scalar/GVN.cpp b/llvm/lib/Transforms/Scalar/GVN.cpp index 7dba4e2d3ab..0593fd7a236 100644 --- a/llvm/lib/Transforms/Scalar/GVN.cpp +++ b/llvm/lib/Transforms/Scalar/GVN.cpp @@ -20,6 +20,7 @@  #include "llvm/ADT/DepthFirstIterator.h"  #include "llvm/ADT/Hashing.h"  #include "llvm/ADT/MapVector.h" +#include "llvm/ADT/PostOrderIterator.h"  #include "llvm/ADT/SetVector.h"  #include "llvm/ADT/SmallPtrSet.h"  #include "llvm/ADT/Statistic.h" @@ -709,6 +710,7 @@ namespace {      void dump(DenseMap<uint32_t, Value*> &d);      bool iterateOnFunction(Function &F);      bool performPRE(Function &F); +    bool performScalarPRE(Instruction *I);      Value *findLeader(const BasicBlock *BB, uint32_t num);      void cleanupGlobalSets();      void verifyRemoved(const Instruction *I) const; @@ -1729,6 +1731,15 @@ bool GVN::processNonLocalLoad(LoadInst *LI) {      return false;    } +  // If this load follows a GEP, see if we can PRE the indices before analyzing. +  if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(LI->getOperand(0))) { +    for (GetElementPtrInst::op_iterator OI = GEP->idx_begin(), +                                        OE = GEP->idx_end(); +         OI != OE; ++OI) +      if (Instruction *I = dyn_cast<Instruction>(OI->get())) +        performScalarPRE(I); +  } +    // Step 2: Analyze the availability of the load    AvailValInBlkVect ValuesPerBlock;    UnavailBlkVect UnavailableBlocks; @@ -2431,175 +2442,182 @@ bool GVN::processBlock(BasicBlock *BB) {    return ChangedFunction;  } -/// performPRE - Perform a purely local form of PRE that looks for diamond -/// control flow patterns and attempts to perform simple PRE at the join point. -bool GVN::performPRE(Function &F) { -  bool Changed = false; +bool GVN::performScalarPRE(Instruction *CurInst) {    SmallVector<std::pair<Value*, BasicBlock*>, 8> predMap; -  for (BasicBlock *CurrentBlock : depth_first(&F.getEntryBlock())) { -    // Nothing to PRE in the entry block. 
-    if (CurrentBlock == &F.getEntryBlock()) continue; -    // Don't perform PRE on a landing pad. -    if (CurrentBlock->isLandingPad()) continue; +  if (isa<AllocaInst>(CurInst) || isa<TerminatorInst>(CurInst) || +      isa<PHINode>(CurInst) || CurInst->getType()->isVoidTy() || +      CurInst->mayReadFromMemory() || CurInst->mayHaveSideEffects() || +      isa<DbgInfoIntrinsic>(CurInst)) +    return false; -    for (BasicBlock::iterator BI = CurrentBlock->begin(), -         BE = CurrentBlock->end(); BI != BE; ) { -      Instruction *CurInst = BI++; +  // Don't do PRE on compares. The PHI would prevent CodeGenPrepare from +  // sinking the compare again, and it would force the code generator to +  // move the i1 from processor flags or predicate registers into a general +  // purpose register. +  if (isa<CmpInst>(CurInst)) +    return false; -      if (isa<AllocaInst>(CurInst) || -          isa<TerminatorInst>(CurInst) || isa<PHINode>(CurInst) || -          CurInst->getType()->isVoidTy() || -          CurInst->mayReadFromMemory() || CurInst->mayHaveSideEffects() || -          isa<DbgInfoIntrinsic>(CurInst)) -        continue; +  // We don't currently value number ANY inline asm calls. +  if (CallInst *CallI = dyn_cast<CallInst>(CurInst)) +    if (CallI->isInlineAsm()) +      return false; -      // Don't do PRE on compares. The PHI would prevent CodeGenPrepare from -      // sinking the compare again, and it would force the code generator to -      // move the i1 from processor flags or predicate registers into a general -      // purpose register. -      if (isa<CmpInst>(CurInst)) -        continue; +  uint32_t ValNo = VN.lookup(CurInst); + +  // Look for the predecessors for PRE opportunities.  We're +  // only trying to solve the basic diamond case, where +  // a value is computed in the successor and one predecessor, +  // but not the other.  
We also explicitly disallow cases +  // where the successor is its own predecessor, because they're +  // more complicated to get right. +  unsigned NumWith = 0; +  unsigned NumWithout = 0; +  BasicBlock *PREPred = nullptr; +  BasicBlock *CurrentBlock = CurInst->getParent(); +  predMap.clear(); + +  for (pred_iterator PI = pred_begin(CurrentBlock), PE = pred_end(CurrentBlock); +       PI != PE; ++PI) { +    BasicBlock *P = *PI; +    // We're not interested in PRE where the block is its +    // own predecessor, or in blocks with predecessors +    // that are not reachable. +    if (P == CurrentBlock) { +      NumWithout = 2; +      break; +    } else if (!DT->isReachableFromEntry(P)) { +      NumWithout = 2; +      break; +    } -      // We don't currently value number ANY inline asm calls. -      if (CallInst *CallI = dyn_cast<CallInst>(CurInst)) -        if (CallI->isInlineAsm()) -          continue; +    Value *predV = findLeader(P, ValNo); +    if (!predV) { +      predMap.push_back(std::make_pair(static_cast<Value *>(nullptr), P)); +      PREPred = P; +      ++NumWithout; +    } else if (predV == CurInst) { +      /* CurInst dominates this predecessor. */ +      NumWithout = 2; +      break; +    } else { +      predMap.push_back(std::make_pair(predV, P)); +      ++NumWith; +    } +  } -      uint32_t ValNo = VN.lookup(CurInst); - -      // Look for the predecessors for PRE opportunities.  We're -      // only trying to solve the basic diamond case, where -      // a value is computed in the successor and one predecessor, -      // but not the other.  We also explicitly disallow cases -      // where the successor is its own predecessor, because they're -      // more complicated to get right. 
-      unsigned NumWith = 0; -      unsigned NumWithout = 0; -      BasicBlock *PREPred = nullptr; -      predMap.clear(); - -      for (pred_iterator PI = pred_begin(CurrentBlock), -           PE = pred_end(CurrentBlock); PI != PE; ++PI) { -        BasicBlock *P = *PI; -        // We're not interested in PRE where the block is its -        // own predecessor, or in blocks with predecessors -        // that are not reachable. -        if (P == CurrentBlock) { -          NumWithout = 2; -          break; -        } else if (!DT->isReachableFromEntry(P))  { -          NumWithout = 2; -          break; -        } +  // Don't do PRE when it might increase code size, i.e. when +  // we would need to insert instructions in more than one pred. +  if (NumWithout != 1 || NumWith == 0) +    return false; -        Value* predV = findLeader(P, ValNo); -        if (!predV) { -          predMap.push_back(std::make_pair(static_cast<Value *>(nullptr), P)); -          PREPred = P; -          ++NumWithout; -        } else if (predV == CurInst) { -          /* CurInst dominates this predecessor. */ -          NumWithout = 2; -          break; -        } else { -          predMap.push_back(std::make_pair(predV, P)); -          ++NumWith; -        } -      } +  // Don't do PRE across indirect branch. +  if (isa<IndirectBrInst>(PREPred->getTerminator())) +    return false; -      // Don't do PRE when it might increase code size, i.e. when -      // we would need to insert instructions in more than one pred. -      if (NumWithout != 1 || NumWith == 0) -        continue; +  // We can't do PRE safely on a critical edge, so instead we schedule +  // the edge to be split and perform the PRE the next time we iterate +  // on the function. 
+  unsigned SuccNum = GetSuccessorNumber(PREPred, CurrentBlock); +  if (isCriticalEdge(PREPred->getTerminator(), SuccNum)) { +    toSplit.push_back(std::make_pair(PREPred->getTerminator(), SuccNum)); +    return false; +  } -      // Don't do PRE across indirect branch. -      if (isa<IndirectBrInst>(PREPred->getTerminator())) -        continue; +  // Instantiate the expression in the predecessor that lacked it. +  // Because we are going top-down through the block, all value numbers +  // will be available in the predecessor by the time we need them.  Any +  // that weren't originally present will have been instantiated earlier +  // in this loop. +  Instruction *PREInstr = CurInst->clone(); +  bool success = true; +  for (unsigned i = 0, e = CurInst->getNumOperands(); i != e; ++i) { +    Value *Op = PREInstr->getOperand(i); +    if (isa<Argument>(Op) || isa<Constant>(Op) || isa<GlobalValue>(Op)) +      continue; -      // We can't do PRE safely on a critical edge, so instead we schedule -      // the edge to be split and perform the PRE the next time we iterate -      // on the function. -      unsigned SuccNum = GetSuccessorNumber(PREPred, CurrentBlock); -      if (isCriticalEdge(PREPred->getTerminator(), SuccNum)) { -        toSplit.push_back(std::make_pair(PREPred->getTerminator(), SuccNum)); -        continue; -      } +    if (Value *V = findLeader(PREPred, VN.lookup(Op))) { +      PREInstr->setOperand(i, V); +    } else { +      success = false; +      break; +    } +  } -      // Instantiate the expression in the predecessor that lacked it. -      // Because we are going top-down through the block, all value numbers -      // will be available in the predecessor by the time we need them.  Any -      // that weren't originally present will have been instantiated earlier -      // in this loop. 
-      Instruction *PREInstr = CurInst->clone(); -      bool success = true; -      for (unsigned i = 0, e = CurInst->getNumOperands(); i != e; ++i) { -        Value *Op = PREInstr->getOperand(i); -        if (isa<Argument>(Op) || isa<Constant>(Op) || isa<GlobalValue>(Op)) -          continue; +  // Fail out if we encounter an operand that is not available in +  // the PRE predecessor.  This is typically because of loads which +  // are not value numbered precisely. +  if (!success) { +    DEBUG(verifyRemoved(PREInstr)); +    delete PREInstr; +    return false; +  } -        if (Value *V = findLeader(PREPred, VN.lookup(Op))) { -          PREInstr->setOperand(i, V); -        } else { -          success = false; -          break; -        } -      } +  PREInstr->insertBefore(PREPred->getTerminator()); +  PREInstr->setName(CurInst->getName() + ".pre"); +  PREInstr->setDebugLoc(CurInst->getDebugLoc()); +  VN.add(PREInstr, ValNo); +  ++NumGVNPRE; -      // Fail out if we encounter an operand that is not available in -      // the PRE predecessor.  This is typically because of loads which -      // are not value numbered precisely. -      if (!success) { -        DEBUG(verifyRemoved(PREInstr)); -        delete PREInstr; -        continue; -      } +  // Update the availability map to include the new instruction. +  addToLeaderTable(ValNo, PREInstr, PREPred); -      PREInstr->insertBefore(PREPred->getTerminator()); -      PREInstr->setName(CurInst->getName() + ".pre"); -      PREInstr->setDebugLoc(CurInst->getDebugLoc()); -      VN.add(PREInstr, ValNo); -      ++NumGVNPRE; - -      // Update the availability map to include the new instruction. -      addToLeaderTable(ValNo, PREInstr, PREPred); - -      // Create a PHI to make the value available in this block. 
-      PHINode* Phi = PHINode::Create(CurInst->getType(), predMap.size(), -                                     CurInst->getName() + ".pre-phi", -                                     CurrentBlock->begin()); -      for (unsigned i = 0, e = predMap.size(); i != e; ++i) { -        if (Value *V = predMap[i].first) -          Phi->addIncoming(V, predMap[i].second); -        else -          Phi->addIncoming(PREInstr, PREPred); -      } +  // Create a PHI to make the value available in this block. +  PHINode *Phi = +      PHINode::Create(CurInst->getType(), predMap.size(), +                      CurInst->getName() + ".pre-phi", CurrentBlock->begin()); +  for (unsigned i = 0, e = predMap.size(); i != e; ++i) { +    if (Value *V = predMap[i].first) +      Phi->addIncoming(V, predMap[i].second); +    else +      Phi->addIncoming(PREInstr, PREPred); +  } + +  VN.add(Phi, ValNo); +  addToLeaderTable(ValNo, Phi, CurrentBlock); +  Phi->setDebugLoc(CurInst->getDebugLoc()); +  CurInst->replaceAllUsesWith(Phi); +  if (Phi->getType()->getScalarType()->isPointerTy()) { +    // Because we have added a PHI-use of the pointer value, it has now +    // "escaped" from alias analysis' perspective.  We need to inform +    // AA of this. +    for (unsigned ii = 0, ee = Phi->getNumIncomingValues(); ii != ee; ++ii) { +      unsigned jj = PHINode::getOperandNumForIncomingValue(ii); +      VN.getAliasAnalysis()->addEscapingUse(Phi->getOperandUse(jj)); +    } -      VN.add(Phi, ValNo); -      addToLeaderTable(ValNo, Phi, CurrentBlock); -      Phi->setDebugLoc(CurInst->getDebugLoc()); -      CurInst->replaceAllUsesWith(Phi); -      if (Phi->getType()->getScalarType()->isPointerTy()) { -        // Because we have added a PHI-use of the pointer value, it has now -        // "escaped" from alias analysis' perspective.  We need to inform -        // AA of this. 
-        for (unsigned ii = 0, ee = Phi->getNumIncomingValues(); ii != ee; -             ++ii) { -          unsigned jj = PHINode::getOperandNumForIncomingValue(ii); -          VN.getAliasAnalysis()->addEscapingUse(Phi->getOperandUse(jj)); -        } +    if (MD) +      MD->invalidateCachedPointerInfo(Phi); +  } +  VN.erase(CurInst); +  removeFromLeaderTable(ValNo, CurInst, CurrentBlock); -        if (MD) -          MD->invalidateCachedPointerInfo(Phi); -      } -      VN.erase(CurInst); -      removeFromLeaderTable(ValNo, CurInst, CurrentBlock); +  DEBUG(dbgs() << "GVN PRE removed: " << *CurInst << '\n'); +  if (MD) +    MD->removeInstruction(CurInst); +  DEBUG(verifyRemoved(CurInst)); +  CurInst->eraseFromParent(); +  return true; +} + +/// performPRE - Perform a purely local form of PRE that looks for diamond +/// control flow patterns and attempts to perform simple PRE at the join point. +bool GVN::performPRE(Function &F) { +  bool Changed = false; +  for (BasicBlock *CurrentBlock : depth_first(&F.getEntryBlock())) { +    // Nothing to PRE in the entry block. +    if (CurrentBlock == &F.getEntryBlock()) +      continue; -      DEBUG(dbgs() << "GVN PRE removed: " << *CurInst << '\n'); -      if (MD) MD->removeInstruction(CurInst); -      DEBUG(verifyRemoved(CurInst)); -      CurInst->eraseFromParent(); -      Changed = true; +    // Don't perform PRE on a landing pad. +    if (CurrentBlock->isLandingPad()) +      continue; + +    for (BasicBlock::iterator BI = CurrentBlock->begin(), +                              BE = CurrentBlock->end(); +         BI != BE;) { +      Instruction *CurInst = BI++; +      Changed = performScalarPRE(CurInst);      }    } @@ -2637,25 +2655,21 @@ bool GVN::iterateOnFunction(Function &F) {    // Top-down walk of the dominator tree    bool Changed = false; -#if 0 -  // Needed for value numbering with phi construction to work. 
-  ReversePostOrderTraversal<Function*> RPOT(&F); -  for (ReversePostOrderTraversal<Function*>::rpo_iterator RI = RPOT.begin(), -       RE = RPOT.end(); RI != RE; ++RI) -    Changed |= processBlock(*RI); -#else    // Save the blocks this function have before transformation begins. GVN may    // split critical edge, and hence may invalidate the RPO/DT iterator.    //    std::vector<BasicBlock *> BBVect;    BBVect.reserve(256); -  for (DomTreeNode *X : depth_first(DT->getRootNode())) -    BBVect.push_back(X->getBlock()); +  // Needed for value numbering with phi construction to work. +  ReversePostOrderTraversal<Function *> RPOT(&F); +  for (ReversePostOrderTraversal<Function *>::rpo_iterator RI = RPOT.begin(), +                                                           RE = RPOT.end(); +       RI != RE; ++RI) +    BBVect.push_back(*RI);    for (std::vector<BasicBlock *>::iterator I = BBVect.begin(), E = BBVect.end();         I != E; I++)      Changed |= processBlock(*I); -#endif    return Changed;  } | 

