summaryrefslogtreecommitdiffstats
path: root/mlir/lib/Dialect/GPU
diff options
context:
space:
mode:
authorStephan Herhut <herhut@google.com>2019-09-09 01:15:10 -0700
committerA. Unique TensorFlower <gardener@tensorflow.org>2019-09-09 01:15:47 -0700
commit318ff019cf703ece10df791b2da8307f3248baee (patch)
tree387d31dcd0bac1b0a4a2b800b11d7f7e47a93ffa /mlir/lib/Dialect/GPU
parent42b60d34fc3dfbad2b26568cf1cd903685df3a3e (diff)
downloadbcm5719-llvm-318ff019cf703ece10df791b2da8307f3248baee.tar.gz
bcm5719-llvm-318ff019cf703ece10df791b2da8307f3248baee.zip
Addressing some late review comments on kernel inlining.
Just formatting and better lit tests, no functional change. PiperOrigin-RevId: 267942907
Diffstat (limited to 'mlir/lib/Dialect/GPU')
-rw-r--r--mlir/lib/Dialect/GPU/Transforms/KernelOutlining.cpp30
1 files changed, 15 insertions, 15 deletions
diff --git a/mlir/lib/Dialect/GPU/Transforms/KernelOutlining.cpp b/mlir/lib/Dialect/GPU/Transforms/KernelOutlining.cpp
index f464b091fc8..26449f6e6f1 100644
--- a/mlir/lib/Dialect/GPU/Transforms/KernelOutlining.cpp
+++ b/mlir/lib/Dialect/GPU/Transforms/KernelOutlining.cpp
@@ -74,22 +74,22 @@ static gpu::LaunchFuncOp inlineConstants(FuncOp kernelFunc,
firstBlock.getArgument(i)->replaceAllUsesWith(newConstant->getResult(0));
firstBlock.eraseArgument(i);
}
- if (newLaunchArgs.size() != launch.getNumKernelOperands()) {
- std::reverse(newLaunchArgs.begin(), newLaunchArgs.end());
- OpBuilder LaunchBuilder(launch);
- SmallVector<Type, 8> newArgumentTypes;
- newArgumentTypes.reserve(firstBlock.getNumArguments());
- for (auto value : firstBlock.getArguments()) {
- newArgumentTypes.push_back(value->getType());
- }
- kernelFunc.setType(LaunchBuilder.getFunctionType(newArgumentTypes, {}));
- auto newLaunch = LaunchBuilder.create<gpu::LaunchFuncOp>(
- launch.getLoc(), kernelFunc, launch.getGridSizeOperandValues(),
- launch.getBlockSizeOperandValues(), newLaunchArgs);
- launch.erase();
- return newLaunch;
+ if (newLaunchArgs.size() == launch.getNumKernelOperands())
+ return launch;
+
+ std::reverse(newLaunchArgs.begin(), newLaunchArgs.end());
+ OpBuilder LaunchBuilder(launch);
+ SmallVector<Type, 8> newArgumentTypes;
+ newArgumentTypes.reserve(firstBlock.getNumArguments());
+ for (auto value : firstBlock.getArguments()) {
+ newArgumentTypes.push_back(value->getType());
}
- return launch;
+ kernelFunc.setType(LaunchBuilder.getFunctionType(newArgumentTypes, {}));
+ auto newLaunch = LaunchBuilder.create<gpu::LaunchFuncOp>(
+ launch.getLoc(), kernelFunc, launch.getGridSizeOperandValues(),
+ launch.getBlockSizeOperandValues(), newLaunchArgs);
+ launch.erase();
+ return newLaunch;
}
// Outline the `gpu.launch` operation body into a kernel function. Replace
OpenPOWER on IntegriCloud