summaryrefslogtreecommitdiffstats
path: root/mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp')
-rw-r--r--mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp110
1 files changed, 110 insertions, 0 deletions
diff --git a/mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp b/mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp
new file mode 100644
index 00000000000..881d165e0c8
--- /dev/null
+++ b/mlir/lib/Target/LLVMIR/ConvertToROCDLIR.cpp
@@ -0,0 +1,110 @@
+//===- ConvertToROCDLIR.cpp - MLIR to LLVM IR conversion ------------------===//
+//
+// Part of the MLIR Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+//
+// This file implements a translation between the MLIR LLVM + ROCDL dialects and
+// LLVM IR with ROCDL intrinsics and metadata.
+//
+//===----------------------------------------------------------------------===//
+
+#include "mlir/Target/ROCDLIR.h"
+
+#include "mlir/Dialect/GPU/GPUDialect.h"
+#include "mlir/Dialect/LLVMIR/LLVMDialect.h"
+#include "mlir/Dialect/LLVMIR/ROCDLDialect.h"
+#include "mlir/IR/Function.h"
+#include "mlir/IR/Module.h"
+#include "mlir/Target/LLVMIR/ModuleTranslation.h"
+#include "mlir/Translation.h"
+
+#include "llvm/ADT/StringRef.h"
+#include "llvm/IR/IntrinsicsAMDGPU.h"
+#include "llvm/IR/Module.h"
+#include "llvm/Support/ToolOutputFile.h"
+
+using namespace mlir;
+
+// Create a call to llvm intrinsic
+static llvm::Value *createIntrinsicCall(llvm::IRBuilder<> &builder,
+ llvm::Intrinsic::ID intrinsic,
+ ArrayRef<llvm::Value *> args = {}) {
+ llvm::Module *module = builder.GetInsertBlock()->getModule();
+ llvm::Function *fn = llvm::Intrinsic::getDeclaration(module, intrinsic);
+ return builder.CreateCall(fn, args);
+}
+
+// Create a call to ROCm-Device-Library function
+// Currently this routine will work only for calling ROCDL functions that
+// take a single int32 argument. It is likely that the interface of this
+// function will change to make it more generic.
+static llvm::Value *createDeviceFunctionCall(llvm::IRBuilder<> &builder,
+ StringRef fn_name, int parameter) {
+ llvm::Module *module = builder.GetInsertBlock()->getModule();
+ llvm::FunctionType *function_type = llvm::FunctionType::get(
+ llvm::Type::getInt64Ty(module->getContext()), // return type.
+ llvm::Type::getInt32Ty(module->getContext()), // parameter type.
+ false); // no variadic arguments.
+ llvm::Function *fn = dyn_cast<llvm::Function>(
+ module->getOrInsertFunction(fn_name, function_type).getCallee());
+ llvm::Value *fn_op0 = llvm::ConstantInt::get(
+ llvm::Type::getInt32Ty(module->getContext()), parameter);
+ return builder.CreateCall(fn, ArrayRef<llvm::Value *>(fn_op0));
+}
+
+namespace {
+class ModuleTranslation : public LLVM::ModuleTranslation {
+
+public:
+ explicit ModuleTranslation(Operation *module)
+ : LLVM::ModuleTranslation(module) {}
+ ~ModuleTranslation() override {}
+
+protected:
+ LogicalResult convertOperation(Operation &opInst,
+ llvm::IRBuilder<> &builder) override {
+
+#include "mlir/Dialect/LLVMIR/ROCDLConversions.inc"
+
+ return LLVM::ModuleTranslation::convertOperation(opInst, builder);
+ }
+};
+} // namespace
+
+std::unique_ptr<llvm::Module> mlir::translateModuleToROCDLIR(Operation *m) {
+ ModuleTranslation translation(m);
+
+ // lower MLIR (with RODL Dialect) to LLVM IR (with ROCDL intrinsics)
+ auto llvmModule =
+ LLVM::ModuleTranslation::translateModule<ModuleTranslation>(m);
+
+ // foreach GPU kernel
+ // 1. Insert AMDGPU_KERNEL calling convention.
+ // 2. Insert amdgpu-flat-workgroup-size(1, 1024) attribute.
+ for (auto func :
+ ModuleTranslation::getModuleBody(m).getOps<LLVM::LLVMFuncOp>()) {
+ if (!func.getAttrOfType<UnitAttr>(gpu::GPUDialect::getKernelFuncAttrName()))
+ continue;
+
+ auto *llvmFunc = llvmModule->getFunction(func.getName());
+
+ llvmFunc->setCallingConv(llvm::CallingConv::AMDGPU_KERNEL);
+
+ llvmFunc->addFnAttr("amdgpu-flat-work-group-size", "1, 1024");
+ }
+
+ return llvmModule;
+}
+
+static TranslateFromMLIRRegistration
+ registration("mlir-to-rocdlir", [](ModuleOp module, raw_ostream &output) {
+ auto llvmModule = mlir::translateModuleToROCDLIR(module);
+ if (!llvmModule)
+ return failure();
+
+ llvmModule->print(output, nullptr);
+ return success();
+ });
OpenPOWER on IntegriCloud