diff options
Diffstat (limited to 'llvm/lib')
-rw-r--r-- | llvm/lib/Analysis/ConstantFolding.cpp | 35 | ||||
-rw-r--r-- | llvm/lib/Analysis/InstructionSimplify.cpp | 26 |
2 files changed, 42 insertions, 19 deletions
diff --git a/llvm/lib/Analysis/ConstantFolding.cpp b/llvm/lib/Analysis/ConstantFolding.cpp index 96a2d02ed5b..6c471ab4504 100644 --- a/llvm/lib/Analysis/ConstantFolding.cpp +++ b/llvm/lib/Analysis/ConstantFolding.cpp @@ -1854,32 +1854,39 @@ Constant *ConstantFoldVectorCall(StringRef Name, unsigned IntrinsicID, auto *SrcPtr = Operands[0]; auto *Mask = Operands[2]; auto *Passthru = Operands[3]; + Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, VTy, DL); - if (!VecData) - return nullptr; SmallVector<Constant *, 32> NewElements; for (unsigned I = 0, E = VTy->getNumElements(); I != E; ++I) { - auto *MaskElt = - dyn_cast_or_null<ConstantInt>(Mask->getAggregateElement(I)); + auto *MaskElt = Mask->getAggregateElement(I); if (!MaskElt) break; - if (MaskElt->isZero()) { - auto *PassthruElt = Passthru->getAggregateElement(I); + auto *PassthruElt = Passthru->getAggregateElement(I); + auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr; + if (isa<UndefValue>(MaskElt)) { + if (PassthruElt) + NewElements.push_back(PassthruElt); + else if (VecElt) + NewElements.push_back(VecElt); + else + return nullptr; + } + if (MaskElt->isNullValue()) { if (!PassthruElt) - break; + return nullptr; NewElements.push_back(PassthruElt); - } else { - assert(MaskElt->isOne()); - auto *VecElt = VecData->getAggregateElement(I); + } else if (MaskElt->isOneValue()) { if (!VecElt) - break; + return nullptr; NewElements.push_back(VecElt); + } else { + return nullptr; } } - if (NewElements.size() == VTy->getNumElements()) - return ConstantVector::get(NewElements); - return nullptr; + if (NewElements.size() != VTy->getNumElements()) + return nullptr; + return ConstantVector::get(NewElements); } for (unsigned I = 0, E = VTy->getNumElements(); I != E; ++I) { diff --git a/llvm/lib/Analysis/InstructionSimplify.cpp b/llvm/lib/Analysis/InstructionSimplify.cpp index 609cd26bcd0..0cb2c78afb4 100644 --- a/llvm/lib/Analysis/InstructionSimplify.cpp +++ b/llvm/lib/Analysis/InstructionSimplify.cpp @@ -3944,6 +3944,22 @@ static Value *SimplifyRelativeLoad(Constant *Ptr, Constant *Offset, return ConstantExpr::getBitCast(LoadedLHSPtr, Int8PtrTy); } +static bool maskIsAllZeroOrUndef(Value *Mask) { + auto *ConstMask = dyn_cast<Constant>(Mask); + if (!ConstMask) + return false; + if (ConstMask->isNullValue() || isa<UndefValue>(ConstMask)) + return true; + for (unsigned I = 0, E = ConstMask->getType()->getVectorNumElements(); I != E; + ++I) { + if (auto *MaskElt = ConstMask->getAggregateElement(I)) + if (MaskElt->isNullValue() || isa<UndefValue>(MaskElt)) + continue; + return false; + } + return true; +} + template <typename IterTy> static Value *SimplifyIntrinsic(Function *F, IterTy ArgBegin, IterTy ArgEnd, const Query &Q, unsigned MaxRecurse) { @@ -3993,11 +4009,11 @@ static Value *SimplifyIntrinsic(Function *F, IterTy ArgBegin, IterTy ArgEnd, // Simplify calls to llvm.masked.load.* if (IID == Intrinsic::masked_load) { - IterTy MaskArg = ArgBegin + 2; - // If the mask is all zeros, the "passthru" argument is the result. - if (auto *ConstMask = dyn_cast<Constant>(*MaskArg)) - if (ConstMask->isNullValue()) - return ArgBegin[3]; + Value *MaskArg = ArgBegin[2]; + Value *PassthruArg = ArgBegin[3]; + // If the mask is all zeros or undef, the "passthru" argument is the result. + if (maskIsAllZeroOrUndef(MaskArg)) + return PassthruArg; } // Perform idempotent optimizations |