//===----- CGOpenCLRuntime.cpp - Interface to OpenCL Runtimes -------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This provides an abstract class for OpenCL code generation. Concrete // subclasses of this implement code generation for specific OpenCL // runtime libraries. // //===----------------------------------------------------------------------===// #include "CGOpenCLRuntime.h" #include "CodeGenFunction.h" #include "TargetInfo.h" #include "clang/CodeGen/ConstantInitBuilder.h" #include "llvm/IR/DerivedTypes.h" #include "llvm/IR/GlobalValue.h" #include using namespace clang; using namespace CodeGen; CGOpenCLRuntime::~CGOpenCLRuntime() {} void CGOpenCLRuntime::EmitWorkGroupLocalVarDecl(CodeGenFunction &CGF, const VarDecl &D) { return CGF.EmitStaticVarDecl(D, llvm::GlobalValue::InternalLinkage); } llvm::Type *CGOpenCLRuntime::convertOpenCLSpecificType(const Type *T) { assert(T->isOpenCLSpecificType() && "Not an OpenCL specific type!"); llvm::LLVMContext& Ctx = CGM.getLLVMContext(); uint32_t AddrSpc = CGM.getContext().getTargetAddressSpace( CGM.getContext().getOpenCLTypeAddrSpace(T)); switch (cast(T)->getKind()) { default: llvm_unreachable("Unexpected opencl builtin type!"); return nullptr; #define IMAGE_TYPE(ImgType, Id, SingletonId, Access, Suffix) \ case BuiltinType::Id: \ return llvm::PointerType::get( \ llvm::StructType::create(Ctx, "opencl." #ImgType "_" #Suffix "_t"), \ AddrSpc); #include "clang/Basic/OpenCLImageTypes.def" case BuiltinType::OCLSampler: return getSamplerType(T); case BuiltinType::OCLEvent: return llvm::PointerType::get( llvm::StructType::create(Ctx, "opencl.event_t"), AddrSpc); case BuiltinType::OCLClkEvent: return llvm::PointerType::get( llvm::StructType::create(Ctx, "opencl.clk_event_t"), AddrSpc); case BuiltinType::OCLQueue: return llvm::PointerType::get( llvm::StructType::create(Ctx, "opencl.queue_t"), AddrSpc); case BuiltinType::OCLReserveID: return llvm::PointerType::get( llvm::StructType::create(Ctx, "opencl.reserve_id_t"), AddrSpc); } } llvm::Type *CGOpenCLRuntime::getPipeType(const PipeType *T) { if (T->isReadOnly()) return getPipeType(T, "opencl.pipe_ro_t", PipeROTy); else return getPipeType(T, "opencl.pipe_wo_t", PipeWOTy); } llvm::Type *CGOpenCLRuntime::getPipeType(const PipeType *T, StringRef Name, llvm::Type *&PipeTy) { if (!PipeTy) PipeTy = llvm::PointerType::get(llvm::StructType::create( CGM.getLLVMContext(), Name), CGM.getContext().getTargetAddressSpace( CGM.getContext().getOpenCLTypeAddrSpace(T))); return PipeTy; } llvm::PointerType *CGOpenCLRuntime::getSamplerType(const Type *T) { if (!SamplerTy) SamplerTy = llvm::PointerType::get(llvm::StructType::create( CGM.getLLVMContext(), "opencl.sampler_t"), CGM.getContext().getTargetAddressSpace( CGM.getContext().getOpenCLTypeAddrSpace(T))); return SamplerTy; } llvm::Value *CGOpenCLRuntime::getPipeElemSize(const Expr *PipeArg) { const PipeType *PipeTy = PipeArg->getType()->getAs(); // The type of the last (implicit) argument to be passed. llvm::Type *Int32Ty = llvm::IntegerType::getInt32Ty(CGM.getLLVMContext()); unsigned TypeSize = CGM.getContext() .getTypeSizeInChars(PipeTy->getElementType()) .getQuantity(); return llvm::ConstantInt::get(Int32Ty, TypeSize, false); } llvm::Value *CGOpenCLRuntime::getPipeElemAlign(const Expr *PipeArg) { const PipeType *PipeTy = PipeArg->getType()->getAs(); // The type of the last (implicit) argument to be passed. llvm::Type *Int32Ty = llvm::IntegerType::getInt32Ty(CGM.getLLVMContext()); unsigned TypeSize = CGM.getContext() .getTypeAlignInChars(PipeTy->getElementType()) .getQuantity(); return llvm::ConstantInt::get(Int32Ty, TypeSize, false); } llvm::PointerType *CGOpenCLRuntime::getGenericVoidPointerType() { assert(CGM.getLangOpts().OpenCL); return llvm::IntegerType::getInt8PtrTy( CGM.getLLVMContext(), CGM.getContext().getTargetAddressSpace(LangAS::opencl_generic)); } // Get the block literal from an expression derived from the block expression. // OpenCL v2.0 s6.12.5: // Block variable declarations are implicitly qualified with const. Therefore // all block variables must be initialized at declaration time and may not be // reassigned. static const BlockExpr *getBlockExpr(const Expr *E) { if (auto Cast = dyn_cast(E)) { E = Cast->getSubExpr(); } if (auto DR = dyn_cast(E)) { E = cast(DR->getDecl())->getInit(); } E = E->IgnoreImplicit(); if (auto Cast = dyn_cast(E)) { E = Cast->getSubExpr(); } return cast(E); } /// Record emitted llvm invoke function and llvm block literal for the /// corresponding block expression. void CGOpenCLRuntime::recordBlockInfo(const BlockExpr *E, llvm::Function *InvokeF, llvm::Value *Block) { assert(EnqueuedBlockMap.find(E) == EnqueuedBlockMap.end() && "Block expression emitted twice"); assert(isa(InvokeF) && "Invalid invoke function"); assert(Block->getType()->isPointerTy() && "Invalid block literal type"); EnqueuedBlockMap[E].InvokeFunc = InvokeF; EnqueuedBlockMap[E].BlockArg = Block; EnqueuedBlockMap[E].Kernel = nullptr; } llvm::Function *CGOpenCLRuntime::getInvokeFunction(const Expr *E) { return EnqueuedBlockMap[getBlockExpr(E)].InvokeFunc; } CGOpenCLRuntime::EnqueuedBlockInfo CGOpenCLRuntime::emitOpenCLEnqueuedBlock(CodeGenFunction &CGF, const Expr *E) { CGF.EmitScalarExpr(E); const BlockExpr *Block = getBlockExpr(E); assert(EnqueuedBlockMap.find(Block) != EnqueuedBlockMap.end() && "Block expression not emitted"); // Do not emit the block wrapper again if it has been emitted. if (EnqueuedBlockMap[Block].Kernel) { return EnqueuedBlockMap[Block]; } auto *F = CGF.getTargetHooks().createEnqueuedBlockKernel( CGF, EnqueuedBlockMap[Block].InvokeFunc, EnqueuedBlockMap[Block].BlockArg->stripPointerCasts()); // The common part of the post-processing of the kernel goes here. F->addFnAttr(llvm::Attribute::NoUnwind); F->setCallingConv( CGF.getTypes().ClangCallConvToLLVMCallConv(CallingConv::CC_OpenCLKernel)); EnqueuedBlockMap[Block].Kernel = F; return EnqueuedBlockMap[Block]; }