diff options
| author | Chris Lattner <sabre@nondot.org> | 2010-12-19 18:22:06 +0000 | 
|---|---|---|
| committer | Chris Lattner <sabre@nondot.org> | 2010-12-19 18:22:06 +0000 | 
| commit | c56c8453778cc070feee78f4a80fe85f6aa2d85c (patch) | |
| tree | 8e894b3252e1c6ab107107534eb7ba4f01c5aad9 /llvm/lib/Transforms/InstCombine | |
| parent | 713ab3796512498b5f4e6ed79ea2ff4e6aa8df9b (diff) | |
| download | bcm5719-llvm-c56c8453778cc070feee78f4a80fe85f6aa2d85c.tar.gz bcm5719-llvm-c56c8453778cc070feee78f4a80fe85f6aa2d85c.zip | |
fix another miscompile in the llvm.sadd formation logic: it wasn't 
checking to see if the high bits of the original add result were dead.
Inserting a smaller add and zexting back to that size is not good enough.
This is likely to be the fix for 8816.
llvm-svn: 122177
Diffstat (limited to 'llvm/lib/Transforms/InstCombine')
| -rw-r--r-- | llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp | 43 | 
1 files changed, 39 insertions, 4 deletions
| diff --git a/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp b/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp index 376a38edda3..11426863f61 100644 --- a/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp +++ b/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp @@ -1585,6 +1585,11 @@ Instruction *InstCombiner::visitICmpInstWithCastAndCast(ICmpInst &ICI) {  /// ProcessUGT_ADDCST_ADD - The caller has matched a pattern of the form:  ///   I = icmp ugt (add (add A, B), CI2), CI1 +/// If this is of the form: +///   sum = a + b +///   if (sum+128 >u 255) +/// Then replace it with llvm.sadd.with.overflow.i8. +///  static Instruction *ProcessUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B,                                            ConstantInt *CI2, ConstantInt *CI1,                                            InstCombiner::BuilderTy *Builder) { @@ -1595,9 +1600,41 @@ static Instruction *ProcessUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B,    // In order to eliminate the add-with-constant, the compare can be its only    // use. -  Value *AddWithCst = I.getOperand(0); +  Instruction *AddWithCst = cast<Instruction>(I.getOperand(0));    if (!AddWithCst->hasOneUse()) return 0; - +   +  // If CI2 is 2^7, 2^15, 2^31, then it might be an sadd.with.overflow. +  if (!CI2->getValue().isPowerOf2()) return 0; +  unsigned NewWidth = CI2->getValue().countTrailingZeros(); +  if (NewWidth != 7 && NewWidth != 15 && NewWidth != 31) return 0; +     +  // The width of the new add formed is 1 more than the bias. +  ++NewWidth; +   +  // Check to see that CI1 is an all-ones value with NewWidth bits. +  if (CI1->getBitWidth() == NewWidth || +      CI1->getValue() != APInt::getLowBitsSet(CI1->getBitWidth(), NewWidth)) +    return 0; +   +  // In order to replace the original add with a narrower  +  // llvm.sadd.with.overflow, the only uses allowed are the add-with-constant +  // and truncates that discard the high bits of the add.  Verify that this is +  // the case. +  Instruction *OrigAdd = cast<Instruction>(AddWithCst->getOperand(0)); +  for (Value::use_iterator UI = OrigAdd->use_begin(), E = OrigAdd->use_end(); +       UI != E; ++UI) { +    if (*UI == AddWithCst) continue; +     +    // Only accept truncates for now.  We would really like a nice recursive +    // predicate like SimplifyDemandedBits, but which goes downwards the use-def +    // chain to see which bits of a value are actually demanded.  If the +    // original add had another add which was then immediately truncated, we +    // could still do the transformation. +    TruncInst *TI = dyn_cast<TruncInst>(*UI); +    if (TI == 0 || +        TI->getType()->getPrimitiveSizeInBits() > NewWidth) return 0; +  } +      const IntegerType *WideType = cast<IntegerType>(CI1->getType());    unsigned WideWidth = WideType->getBitWidth();    unsigned NarrowWidth = WideWidth / 2; @@ -1630,8 +1667,6 @@ static Instruction *ProcessUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B,    // If the pattern matches, truncate the inputs to the narrower type and    // use the sadd_with_overflow intrinsic to efficiently compute both the    // result and the overflow bit. -  Instruction *OrigAdd = -  cast<Instruction>(cast<Instruction>(I.getOperand(0))->getOperand(0));    Builder->SetInsertPoint(OrigAdd->getParent(),                            BasicBlock::iterator(OrigAdd)); | 

