diff options
Diffstat (limited to 'clang/lib')
| -rw-r--r-- | clang/lib/AST/OpenMPClause.cpp | 12 | ||||
| -rw-r--r-- | clang/lib/AST/StmtProfile.cpp | 7 | ||||
| -rw-r--r-- | clang/lib/CodeGen/CGExpr.cpp | 33 | ||||
| -rw-r--r-- | clang/lib/CodeGen/CGOpenMPRuntime.cpp | 41 | ||||
| -rw-r--r-- | clang/lib/CodeGen/CGOpenMPRuntime.h | 19 | ||||
| -rw-r--r-- | clang/lib/CodeGen/CGStmtOpenMP.cpp | 5 | ||||
| -rw-r--r-- | clang/lib/Sema/SemaOpenMP.cpp | 46 | ||||
| -rw-r--r-- | clang/lib/Serialization/ASTReader.cpp | 5 | ||||
| -rw-r--r-- | clang/lib/Serialization/ASTWriter.cpp | 2 | 
9 files changed, 147 insertions, 23 deletions
| diff --git a/clang/lib/AST/OpenMPClause.cpp b/clang/lib/AST/OpenMPClause.cpp index f062c3e463a..790b4401229 100644 --- a/clang/lib/AST/OpenMPClause.cpp +++ b/clang/lib/AST/OpenMPClause.cpp @@ -1162,8 +1162,8 @@ OMPNontemporalClause *OMPNontemporalClause::Create(const ASTContext &C,                                                     SourceLocation LParenLoc,                                                     SourceLocation EndLoc,                                                     ArrayRef<Expr *> VL) { -  // Allocate space for nontemporal variables. -  void *Mem = C.Allocate(totalSizeToAlloc<Expr *>(VL.size())); +  // Allocate space for nontemporal variables + private references. +  void *Mem = C.Allocate(totalSizeToAlloc<Expr *>(2 * VL.size()));    auto *Clause =        new (Mem) OMPNontemporalClause(StartLoc, LParenLoc, EndLoc, VL.size());    Clause->setVarRefs(VL); @@ -1172,10 +1172,16 @@ OMPNontemporalClause *OMPNontemporalClause::Create(const ASTContext &C,  OMPNontemporalClause *OMPNontemporalClause::CreateEmpty(const ASTContext &C,                                                          unsigned N) { -  void *Mem = C.Allocate(totalSizeToAlloc<Expr *>(N)); +  void *Mem = C.Allocate(totalSizeToAlloc<Expr *>(2 * N));    return new (Mem) OMPNontemporalClause(N);  } +void OMPNontemporalClause::setPrivateRefs(ArrayRef<Expr *> VL) { +  assert(VL.size() == varlist_size() && "Number of private references is not " +                                        "the same as the preallocated buffer"); +  std::copy(VL.begin(), VL.end(), varlist_end()); +} +  //===----------------------------------------------------------------------===//  //  OpenMP clauses printing methods  //===----------------------------------------------------------------------===// diff --git a/clang/lib/AST/StmtProfile.cpp b/clang/lib/AST/StmtProfile.cpp index 56a65e8deb9..2aa5106e90f 100644 --- a/clang/lib/AST/StmtProfile.cpp +++ b/clang/lib/AST/StmtProfile.cpp @@ -769,10 +769,13 @@ void OMPClauseProfiler::VisitOMPIsDevicePtrClause(      const OMPIsDevicePtrClause *C) {    VisitOMPClauseList(C);  } -void OMPClauseProfiler::VisitOMPNontemporalClause(const OMPNontemporalClause *C) { +void OMPClauseProfiler::VisitOMPNontemporalClause( +    const OMPNontemporalClause *C) {    VisitOMPClauseList(C); +  for (auto *E : C->private_refs()) +    Profiler->VisitStmt(E);  } -} +} // namespace  void  StmtProfiler::VisitOMPExecutableDirective(const OMPExecutableDirective *S) { diff --git a/clang/lib/CodeGen/CGExpr.cpp b/clang/lib/CodeGen/CGExpr.cpp index cd42faefab0..c729037852e 100644 --- a/clang/lib/CodeGen/CGExpr.cpp +++ b/clang/lib/CodeGen/CGExpr.cpp @@ -2566,21 +2566,35 @@ LValue CodeGenFunction::EmitDeclRefLValue(const DeclRefExpr *E) {        VD = VD->getCanonicalDecl();        if (auto *FD = LambdaCaptureFields.lookup(VD))          return EmitCapturedFieldLValue(*this, FD, CXXABIThisValue); -      else if (CapturedStmtInfo) { +      if (CapturedStmtInfo) {          auto I = LocalDeclMap.find(VD);          if (I != LocalDeclMap.end()) { +          LValue CapLVal;            if (VD->getType()->isReferenceType()) -            return EmitLoadOfReferenceLValue(I->second, VD->getType(), -                                             AlignmentSource::Decl); -          return MakeAddrLValue(I->second, T); +            CapLVal = EmitLoadOfReferenceLValue(I->second, VD->getType(), +                                                AlignmentSource::Decl); +          else +            CapLVal = MakeAddrLValue(I->second, T); +          // Mark lvalue as nontemporal if the variable is marked as nontemporal +          // in simd context. +          if (getLangOpts().OpenMP && +              CGM.getOpenMPRuntime().isNontemporalDecl(VD)) +            CapLVal.setNontemporal(/*Value=*/true); +          return CapLVal;          }          LValue CapLVal =              EmitCapturedFieldLValue(*this, CapturedStmtInfo->lookup(VD),                                      CapturedStmtInfo->getContextValue()); -        return MakeAddrLValue( +        CapLVal = MakeAddrLValue(              Address(CapLVal.getPointer(*this), getContext().getDeclAlign(VD)),              CapLVal.getType(), LValueBaseInfo(AlignmentSource::Decl),              CapLVal.getTBAAInfo()); +        // Mark lvalue as nontemporal if the variable is marked as nontemporal +        // in simd context. +        if (getLangOpts().OpenMP && +            CGM.getOpenMPRuntime().isNontemporalDecl(VD)) +          CapLVal.setNontemporal(/*Value=*/true); +        return CapLVal;        }        assert(isa<BlockDecl>(CurCodeDecl)); @@ -3929,6 +3943,15 @@ LValue CodeGenFunction::EmitMemberExpr(const MemberExpr *E) {    if (auto *Field = dyn_cast<FieldDecl>(ND)) {      LValue LV = EmitLValueForField(BaseLV, Field);      setObjCGCLValueClass(getContext(), E, LV); +    if (getLangOpts().OpenMP) { +      // If the member was explicitly marked as nontemporal, mark it as +      // nontemporal. If the base lvalue is marked as nontemporal, mark access +      // to children as nontemporal too. +      if ((IsWrappedCXXThis(BaseExpr) && +           CGM.getOpenMPRuntime().isNontemporalDecl(Field)) || +          BaseLV.isNontemporal()) +        LV.setNontemporal(/*Value=*/true); +    }      return LV;    } diff --git a/clang/lib/CodeGen/CGOpenMPRuntime.cpp b/clang/lib/CodeGen/CGOpenMPRuntime.cpp index 1aae18b4504..2a53e999353 100644 --- a/clang/lib/CodeGen/CGOpenMPRuntime.cpp +++ b/clang/lib/CodeGen/CGOpenMPRuntime.cpp @@ -17,6 +17,7 @@  #include "CodeGenFunction.h"  #include "clang/AST/Attr.h"  #include "clang/AST/Decl.h" +#include "clang/AST/OpenMPClause.h"  #include "clang/AST/StmtOpenMP.h"  #include "clang/Basic/BitmaskEnum.h"  #include "clang/CodeGen/ConstantInitBuilder.h" @@ -11341,6 +11342,46 @@ bool CGOpenMPRuntime::emitDeclareVariant(GlobalDecl GD, bool IsForDefinition) {    return true;  } +CGOpenMPRuntime::NontemporalDeclsRAII::NontemporalDeclsRAII( +    CodeGenModule &CGM, const OMPLoopDirective &S) +    : CGM(CGM), NeedToPush(S.hasClausesOfKind<OMPNontemporalClause>()) { +  assert(CGM.getLangOpts().OpenMP && "Not in OpenMP mode."); +  if (!NeedToPush) +    return; +  NontemporalDeclsSet &DS = +      CGM.getOpenMPRuntime().NontemporalDeclsStack.emplace_back(); +  for (const auto *C : S.getClausesOfKind<OMPNontemporalClause>()) { +    for (const Stmt *Ref : C->private_refs()) { +      const auto *SimpleRefExpr = cast<Expr>(Ref)->IgnoreParenImpCasts(); +      const ValueDecl *VD; +      if (const auto *DRE = dyn_cast<DeclRefExpr>(SimpleRefExpr)) { +        VD = DRE->getDecl(); +      } else { +        const auto *ME = cast<MemberExpr>(SimpleRefExpr); +        assert((ME->isImplicitCXXThis() || +                isa<CXXThisExpr>(ME->getBase()->IgnoreParenImpCasts())) && +               "Expected member of current class."); +        VD = ME->getMemberDecl(); +      } +      DS.insert(VD); +    } +  } +} + +CGOpenMPRuntime::NontemporalDeclsRAII::~NontemporalDeclsRAII() { +  if (!NeedToPush) +    return; +  CGM.getOpenMPRuntime().NontemporalDeclsStack.pop_back(); +} + +bool CGOpenMPRuntime::isNontemporalDecl(const ValueDecl *VD) const { +  assert(CGM.getLangOpts().OpenMP && "Not in OpenMP mode."); + +  return llvm::any_of( +      CGM.getOpenMPRuntime().NontemporalDeclsStack, +      [VD](const NontemporalDeclsSet &Set) { return Set.count(VD) > 0; }); +} +  llvm::Function *CGOpenMPSIMDRuntime::emitParallelOutlinedFunction(      const OMPExecutableDirective &D, const VarDecl *ThreadIDVar,      OpenMPDirectiveKind InnermostKind, const RegionCodeGenTy &CodeGen) { diff --git a/clang/lib/CodeGen/CGOpenMPRuntime.h b/clang/lib/CodeGen/CGOpenMPRuntime.h index d806c27fdcb..f1582457ed2 100644 --- a/clang/lib/CodeGen/CGOpenMPRuntime.h +++ b/clang/lib/CodeGen/CGOpenMPRuntime.h @@ -211,6 +211,16 @@ public:      ~DisableAutoDeclareTargetRAII();    }; +  /// Manages list of nontemporal decls for the specified directive. +  class NontemporalDeclsRAII { +    CodeGenModule &CGM; +    const bool NeedToPush; + +  public: +    NontemporalDeclsRAII(CodeGenModule &CGM, const OMPLoopDirective &S); +    ~NontemporalDeclsRAII(); +  }; +  protected:    CodeGenModule &CGM;    StringRef FirstSeparator, Separator; @@ -650,6 +660,11 @@ private:                    std::pair<GlobalDecl, GlobalDecl>>        DeferredVariantFunction; +  using NontemporalDeclsSet = llvm::SmallDenseSet<CanonicalDeclPtr<const Decl>>; +  /// Stack for list of declarations in current context marked as nontemporal. +  /// The set is the union of all current stack elements. +  llvm::SmallVector<NontemporalDeclsSet, 4> NontemporalDeclsStack; +    /// Flag for keeping track of weather a requires unified_shared_memory    /// directive is present.    bool HasRequiresUnifiedSharedMemory = false; @@ -1663,6 +1678,10 @@ public:    /// Emits the definition of the declare variant function.    virtual bool emitDeclareVariant(GlobalDecl GD, bool IsForDefinition); + +  /// Checks if the \p VD variable is marked as nontemporal declaration in +  /// current context. +  bool isNontemporalDecl(const ValueDecl *VD) const;  };  /// Class supports emissionof SIMD-only code. diff --git a/clang/lib/CodeGen/CGStmtOpenMP.cpp b/clang/lib/CodeGen/CGStmtOpenMP.cpp index e8a3790e3b5..a2a59b64ddb 100644 --- a/clang/lib/CodeGen/CGStmtOpenMP.cpp +++ b/clang/lib/CodeGen/CGStmtOpenMP.cpp @@ -1803,8 +1803,9 @@ static LValue EmitOMPHelperVar(CodeGenFunction &CGF,  static void emitCommonSimdLoop(CodeGenFunction &CGF, const OMPLoopDirective &S,                                 const RegionCodeGenTy &SimdInitGen,                                 const RegionCodeGenTy &BodyCodeGen) { -  auto &&ThenGen = [&SimdInitGen, &BodyCodeGen](CodeGenFunction &CGF, -                                                PrePostActionTy &) { +  auto &&ThenGen = [&S, &SimdInitGen, &BodyCodeGen](CodeGenFunction &CGF, +                                                    PrePostActionTy &) { +    CGOpenMPRuntime::NontemporalDeclsRAII NontemporalsRegion(CGF.CGM, S);      CodeGenFunction::OMPLocalDeclMapRAII Scope(CGF);      SimdInitGen(CGF); diff --git a/clang/lib/Sema/SemaOpenMP.cpp b/clang/lib/Sema/SemaOpenMP.cpp index 915bf53d06e..7365fda62be 100644 --- a/clang/lib/Sema/SemaOpenMP.cpp +++ b/clang/lib/Sema/SemaOpenMP.cpp @@ -2230,6 +2230,11 @@ void Sema::EndOpenMPClause() {  static void checkAllocateClauses(Sema &S, DSAStackTy *Stack,                                   ArrayRef<OMPClause *> Clauses); +static std::pair<ValueDecl *, bool> +getPrivateItem(Sema &S, Expr *&RefExpr, SourceLocation &ELoc, +               SourceRange &ERange, bool AllowArraySection = false); +static DeclRefExpr *buildCapture(Sema &S, ValueDecl *D, Expr *CaptureExpr, +                                 bool WithInit);  void Sema::EndOpenMPDSABlock(Stmt *CurDirective) {    // OpenMP [2.14.3.5, Restrictions, C/C++, p.1] @@ -2274,6 +2279,31 @@ void Sema::EndOpenMPDSABlock(Stmt *CurDirective) {            }          }          Clause->setPrivateCopies(PrivateCopies); +        continue; +      } +      // Finalize nontemporal clause by handling private copies, if any. +      if (auto *Clause = dyn_cast<OMPNontemporalClause>(C)) { +        SmallVector<Expr *, 8> PrivateRefs; +        for (Expr *RefExpr : Clause->varlists()) { +          assert(RefExpr && "NULL expr in OpenMP nontemporal clause."); +          SourceLocation ELoc; +          SourceRange ERange; +          Expr *SimpleRefExpr = RefExpr; +          auto Res = getPrivateItem(*this, SimpleRefExpr, ELoc, ERange); +          if (Res.second) +            // It will be analyzed later. +            PrivateRefs.push_back(RefExpr); +          ValueDecl *D = Res.first; +          if (!D) +            continue; + +          const DSAStackTy::DSAVarData DVar = +              DSAStack->getTopDSA(D, /*FromParent=*/false); +          PrivateRefs.push_back(DVar.PrivateCopy ? DVar.PrivateCopy +                                                 : SimpleRefExpr); +        } +        Clause->setPrivateRefs(PrivateRefs); +        continue;        }      }      // Check allocate clauses. @@ -4262,9 +4292,10 @@ static bool checkIfClauses(Sema &S, OpenMPDirectiveKind Kind,    return ErrorFound;  } -static std::pair<ValueDecl *, bool> -getPrivateItem(Sema &S, Expr *&RefExpr, SourceLocation &ELoc, -               SourceRange &ERange, bool AllowArraySection = false) { +static std::pair<ValueDecl *, bool> getPrivateItem(Sema &S, Expr *&RefExpr, +                                                   SourceLocation &ELoc, +                                                   SourceRange &ERange, +                                                   bool AllowArraySection) {    if (RefExpr->isTypeDependent() || RefExpr->isValueDependent() ||        RefExpr->containsUnexpandedParameterPack())      return std::make_pair(nullptr, true); @@ -17172,8 +17203,6 @@ OMPClause *Sema::ActOnOpenMPNontemporalClause(ArrayRef<Expr *> VarList,      if (!D)        continue; -    auto *VD = dyn_cast<VarDecl>(D); -      // OpenMP 5.0, 2.9.3.1 simd Construct, Restrictions.      // A list-item cannot appear in more than one nontemporal clause.      if (const Expr *PrevRef = @@ -17185,12 +17214,7 @@ OMPClause *Sema::ActOnOpenMPNontemporalClause(ArrayRef<Expr *> VarList,        continue;      } -    DeclRefExpr *Ref = nullptr; -    if (!VD && isOpenMPCapturedDecl(D) && !CurContext->isDependentContext()) -      Ref = buildCapture(*this, D, SimpleRefExpr, /*WithInit=*/true); -    Vars.push_back((VD || !Ref || CurContext->isDependentContext()) -                       ? RefExpr->IgnoreParens() -                       : Ref); +    Vars.push_back(RefExpr);    }    if (Vars.empty()) diff --git a/clang/lib/Serialization/ASTReader.cpp b/clang/lib/Serialization/ASTReader.cpp index 9258a6fb126..032ce888969 100644 --- a/clang/lib/Serialization/ASTReader.cpp +++ b/clang/lib/Serialization/ASTReader.cpp @@ -12466,4 +12466,9 @@ void OMPClauseReader::VisitOMPNontemporalClause(OMPNontemporalClause *C) {    for (unsigned i = 0; i != NumVars; ++i)      Vars.push_back(Record.readSubExpr());    C->setVarRefs(Vars); +  Vars.clear(); +  Vars.reserve(NumVars); +  for (unsigned i = 0; i != NumVars; ++i) +    Vars.push_back(Record.readSubExpr()); +  C->setPrivateRefs(Vars);  } diff --git a/clang/lib/Serialization/ASTWriter.cpp b/clang/lib/Serialization/ASTWriter.cpp index a632072d01b..2e2ce0e875d 100644 --- a/clang/lib/Serialization/ASTWriter.cpp +++ b/clang/lib/Serialization/ASTWriter.cpp @@ -6544,4 +6544,6 @@ void OMPClauseWriter::VisitOMPNontemporalClause(OMPNontemporalClause *C) {    Record.AddSourceLocation(C->getLParenLoc());    for (auto *VE : C->varlists())      Record.AddStmt(VE); +  for (auto *E : C->private_refs()) +    Record.AddStmt(E);  } | 

