This allow lowering to support scf.for and scf.if with results. As right now spv region operations don't have return value the results are demoted to Function memory. We create one allocation per result right before the region and store the yield values in it. Then we can load back the value from allocation to be able to use the results. Differential Revision: https://reviews.llvm.org/D82246
74 lines
2.9 KiB
C++
74 lines
2.9 KiB
C++
//===- ConvertGPUToSPIRVPass.cpp - GPU to SPIR-V dialect lowering passes --===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements a pass to convert a kernel function in the GPU Dialect
|
|
// into a spv.module operation
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "mlir/Conversion/GPUToSPIRV/ConvertGPUToSPIRVPass.h"
|
|
#include "../PassDetail.h"
|
|
#include "mlir/Conversion/GPUToSPIRV/ConvertGPUToSPIRV.h"
|
|
#include "mlir/Conversion/SCFToSPIRV/SCFToSPIRV.h"
|
|
#include "mlir/Conversion/StandardToSPIRV/ConvertStandardToSPIRV.h"
|
|
#include "mlir/Dialect/GPU/GPUDialect.h"
|
|
#include "mlir/Dialect/SCF/SCF.h"
|
|
#include "mlir/Dialect/SPIRV/SPIRVDialect.h"
|
|
#include "mlir/Dialect/SPIRV/SPIRVLowering.h"
|
|
#include "mlir/Dialect/SPIRV/SPIRVOps.h"
|
|
|
|
using namespace mlir;
|
|
|
|
namespace {
|
|
/// Pass to lower GPU Dialect to SPIR-V. The pass only converts the gpu.func ops
|
|
/// inside gpu.module ops. i.e., the function that are referenced in
|
|
/// gpu.launch_func ops. For each such function
|
|
///
|
|
/// 1) Create a spirv::ModuleOp, and clone the function into spirv::ModuleOp
|
|
/// (the original function is still needed by the gpu::LaunchKernelOp, so cannot
|
|
/// replace it).
|
|
///
|
|
/// 2) Lower the body of the spirv::ModuleOp.
|
|
struct GPUToSPIRVPass : public ConvertGPUToSPIRVBase<GPUToSPIRVPass> {
|
|
void runOnOperation() override;
|
|
};
|
|
} // namespace
|
|
|
|
void GPUToSPIRVPass::runOnOperation() {
|
|
MLIRContext *context = &getContext();
|
|
ModuleOp module = getOperation();
|
|
|
|
SmallVector<Operation *, 1> kernelModules;
|
|
OpBuilder builder(context);
|
|
module.walk([&builder, &kernelModules](gpu::GPUModuleOp moduleOp) {
|
|
// For each kernel module (should be only 1 for now, but that is not a
|
|
// requirement here), clone the module for conversion because the
|
|
// gpu.launch function still needs the kernel module.
|
|
builder.setInsertionPoint(moduleOp.getOperation());
|
|
kernelModules.push_back(builder.clone(*moduleOp.getOperation()));
|
|
});
|
|
|
|
auto targetAttr = spirv::lookupTargetEnvOrDefault(module);
|
|
std::unique_ptr<ConversionTarget> target =
|
|
spirv::SPIRVConversionTarget::get(targetAttr);
|
|
|
|
SPIRVTypeConverter typeConverter(targetAttr);
|
|
ScfToSPIRVContext scfContext;
|
|
OwningRewritePatternList patterns;
|
|
populateGPUToSPIRVPatterns(context, typeConverter, patterns);
|
|
populateSCFToSPIRVPatterns(context, typeConverter,scfContext, patterns);
|
|
populateStandardToSPIRVPatterns(context, typeConverter, patterns);
|
|
|
|
if (failed(applyFullConversion(kernelModules, *target, patterns)))
|
|
return signalPassFailure();
|
|
}
|
|
|
|
std::unique_ptr<OperationPass<ModuleOp>> mlir::createConvertGPUToSPIRVPass() {
|
|
return std::make_unique<GPUToSPIRVPass>();
|
|
}
|