//===- ConvertGPUToSPIRV.cpp - Convert GPU ops to SPIR-V dialect ----------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file implements the conversion patterns from GPU ops to SPIR-V dialect. // //===----------------------------------------------------------------------===// #include "mlir/Conversion/GPUToSPIRV/ConvertGPUToSPIRV.h" #include "mlir/Dialect/GPU/GPUDialect.h" #include "mlir/Dialect/LoopOps/LoopOps.h" #include "mlir/Dialect/SPIRV/SPIRVDialect.h" #include "mlir/Dialect/SPIRV/SPIRVLowering.h" #include "mlir/Dialect/SPIRV/SPIRVOps.h" #include "mlir/IR/Module.h" using namespace mlir; namespace { /// Pattern to convert a loop::ForOp within kernel functions into spirv::LoopOp. class ForOpConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(loop::ForOp forOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; /// Pattern to convert a loop::IfOp within kernel functions into /// spirv::SelectionOp. class IfOpConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(loop::IfOp IfOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; /// Pattern to erase a loop::YieldOp. class TerminatorOpConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(loop::YieldOp terminatorOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override { rewriter.eraseOp(terminatorOp); return success(); } }; /// Pattern lowering GPU block/thread size/id to loading SPIR-V invocation /// builin variables. template class LaunchConfigConversion : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(SourceOp op, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; /// This is separate because in Vulkan workgroup size is exposed to shaders via /// a constant with WorkgroupSize decoration. So here we cannot generate a /// builtin variable; instead the information in the `spv.entry_point_abi` /// attribute on the surrounding FuncOp is used to replace the gpu::BlockDimOp. class WorkGroupSizeConversion : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(gpu::BlockDimOp op, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; /// Pattern to convert a kernel function in GPU dialect within a spv.module. class GPUFuncOpConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(gpu::GPUFuncOp funcOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; private: SmallVector workGroupSizeAsInt32; }; /// Pattern to convert a gpu.module to a spv.module. class GPUModuleConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(gpu::GPUModuleOp moduleOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; /// Pattern to convert a gpu.return into a SPIR-V return. // TODO: This can go to DRR when GPU return has operands. class GPUReturnOpConversion final : public SPIRVOpLowering { public: using SPIRVOpLowering::SPIRVOpLowering; LogicalResult matchAndRewrite(gpu::ReturnOp returnOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const override; }; } // namespace //===----------------------------------------------------------------------===// // loop::ForOp. //===----------------------------------------------------------------------===// LogicalResult ForOpConversion::matchAndRewrite(loop::ForOp forOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const { // loop::ForOp can be lowered to the structured control flow represented by // spirv::LoopOp by making the continue block of the spirv::LoopOp the loop // latch and the merge block the exit block. The resulting spirv::LoopOp has a // single back edge from the continue to header block, and a single exit from // header to merge. loop::ForOpOperandAdaptor forOperands(operands); auto loc = forOp.getLoc(); auto loopControl = rewriter.getI32IntegerAttr( static_cast(spirv::LoopControl::None)); auto loopOp = rewriter.create(loc, loopControl); loopOp.addEntryAndMergeBlock(); OpBuilder::InsertionGuard guard(rewriter); // Create the block for the header. auto header = new Block(); // Insert the header. loopOp.body().getBlocks().insert(std::next(loopOp.body().begin(), 1), header); // Create the new induction variable to use. BlockArgument newIndVar = header->addArgument(forOperands.lowerBound().getType()); Block *body = forOp.getBody(); // Apply signature conversion to the body of the forOp. It has a single block, // with argument which is the induction variable. That has to be replaced with // the new induction variable. TypeConverter::SignatureConversion signatureConverter( body->getNumArguments()); signatureConverter.remapInput(0, newIndVar); body = rewriter.applySignatureConversion(&forOp.getLoopBody(), signatureConverter); // Delete the loop terminator. rewriter.eraseOp(body->getTerminator()); // Move the blocks from the forOp into the loopOp. This is the body of the // loopOp. rewriter.inlineRegionBefore(forOp.getOperation()->getRegion(0), loopOp.body(), std::next(loopOp.body().begin(), 2)); // Branch into it from the entry. rewriter.setInsertionPointToEnd(&(loopOp.body().front())); rewriter.create(loc, header, forOperands.lowerBound()); // Generate the rest of the loop header. rewriter.setInsertionPointToEnd(header); auto mergeBlock = loopOp.getMergeBlock(); auto cmpOp = rewriter.create( loc, rewriter.getI1Type(), newIndVar, forOperands.upperBound()); rewriter.create( loc, cmpOp, body, ArrayRef(), mergeBlock, ArrayRef()); // Generate instructions to increment the step of the induction variable and // branch to the header. Block *continueBlock = loopOp.getContinueBlock(); rewriter.setInsertionPointToEnd(continueBlock); // Add the step to the induction variable and branch to the header. Value updatedIndVar = rewriter.create( loc, newIndVar.getType(), newIndVar, forOperands.step()); rewriter.create(loc, header, updatedIndVar); rewriter.eraseOp(forOp); return success(); } //===----------------------------------------------------------------------===// // loop::IfOp. //===----------------------------------------------------------------------===// LogicalResult IfOpConversion::matchAndRewrite(loop::IfOp ifOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const { // When lowering `loop::IfOp` we explicitly create a selection header block // before the control flow diverges and a merge block where control flow // subsequently converges. loop::IfOpOperandAdaptor ifOperands(operands); auto loc = ifOp.getLoc(); // Create `spv.selection` operation, selection header block and merge block. auto selectionControl = rewriter.getI32IntegerAttr( static_cast(spirv::SelectionControl::None)); auto selectionOp = rewriter.create(loc, selectionControl); selectionOp.addMergeBlock(); auto *mergeBlock = selectionOp.getMergeBlock(); OpBuilder::InsertionGuard guard(rewriter); auto *selectionHeaderBlock = new Block(); selectionOp.body().getBlocks().push_front(selectionHeaderBlock); // Inline `then` region before the merge block and branch to it. auto &thenRegion = ifOp.thenRegion(); auto *thenBlock = &thenRegion.front(); rewriter.setInsertionPointToEnd(&thenRegion.back()); rewriter.create(loc, mergeBlock); rewriter.inlineRegionBefore(thenRegion, mergeBlock); auto *elseBlock = mergeBlock; // If `else` region is not empty, inline that region before the merge block // and branch to it. if (!ifOp.elseRegion().empty()) { auto &elseRegion = ifOp.elseRegion(); elseBlock = &elseRegion.front(); rewriter.setInsertionPointToEnd(&elseRegion.back()); rewriter.create(loc, mergeBlock); rewriter.inlineRegionBefore(elseRegion, mergeBlock); } // Create a `spv.BranchConditional` operation for selection header block. rewriter.setInsertionPointToEnd(selectionHeaderBlock); rewriter.create(loc, ifOperands.condition(), thenBlock, ArrayRef(), elseBlock, ArrayRef()); rewriter.eraseOp(ifOp); return success(); } //===----------------------------------------------------------------------===// // Builtins. //===----------------------------------------------------------------------===// static Optional getLaunchConfigIndex(Operation *op) { auto dimAttr = op->getAttrOfType("dimension"); if (!dimAttr) { return {}; } if (dimAttr.getValue() == "x") { return 0; } else if (dimAttr.getValue() == "y") { return 1; } else if (dimAttr.getValue() == "z") { return 2; } return {}; } template LogicalResult LaunchConfigConversion::matchAndRewrite( SourceOp op, ArrayRef operands, ConversionPatternRewriter &rewriter) const { auto index = getLaunchConfigIndex(op); if (!index) return failure(); // SPIR-V invocation builtin variables are a vector of type <3xi32> auto spirvBuiltin = spirv::getBuiltinVariableValue(op, builtin, rewriter); rewriter.replaceOpWithNewOp( op, rewriter.getIntegerType(32), spirvBuiltin, rewriter.getI32ArrayAttr({index.getValue()})); return success(); } LogicalResult WorkGroupSizeConversion::matchAndRewrite( gpu::BlockDimOp op, ArrayRef operands, ConversionPatternRewriter &rewriter) const { auto index = getLaunchConfigIndex(op); if (!index) return failure(); auto workGroupSizeAttr = spirv::lookupLocalWorkGroupSize(op); auto val = workGroupSizeAttr.getValue(index.getValue()); auto convertedType = typeConverter.convertType(op.getResult().getType()); if (!convertedType) return failure(); rewriter.replaceOpWithNewOp( op, convertedType, IntegerAttr::get(convertedType, val)); return success(); } //===----------------------------------------------------------------------===// // GPUFuncOp //===----------------------------------------------------------------------===// // Legalizes a GPU function as an entry SPIR-V function. static spirv::FuncOp lowerAsEntryFunction(gpu::GPUFuncOp funcOp, SPIRVTypeConverter &typeConverter, ConversionPatternRewriter &rewriter, spirv::EntryPointABIAttr entryPointInfo, ArrayRef argABIInfo) { auto fnType = funcOp.getType(); if (fnType.getNumResults()) { funcOp.emitError("SPIR-V lowering only supports entry functions" "with no return values right now"); return nullptr; } if (fnType.getNumInputs() != argABIInfo.size()) { funcOp.emitError( "lowering as entry functions requires ABI info for all arguments"); return nullptr; } // Update the signature to valid SPIR-V types and add the ABI // attributes. These will be "materialized" by using the // LowerABIAttributesPass. TypeConverter::SignatureConversion signatureConverter(fnType.getNumInputs()); { for (auto argType : enumerate(funcOp.getType().getInputs())) { auto convertedType = typeConverter.convertType(argType.value()); signatureConverter.addInputs(argType.index(), convertedType); } } auto newFuncOp = rewriter.create( funcOp.getLoc(), funcOp.getName(), rewriter.getFunctionType(signatureConverter.getConvertedTypes(), llvm::None)); for (const auto &namedAttr : funcOp.getAttrs()) { if (namedAttr.first.is(impl::getTypeAttrName()) || namedAttr.first.is(SymbolTable::getSymbolAttrName())) continue; newFuncOp.setAttr(namedAttr.first, namedAttr.second); } rewriter.inlineRegionBefore(funcOp.getBody(), newFuncOp.getBody(), newFuncOp.end()); rewriter.applySignatureConversion(&newFuncOp.getBody(), signatureConverter); rewriter.eraseOp(funcOp); spirv::setABIAttrs(newFuncOp, entryPointInfo, argABIInfo); return newFuncOp; } LogicalResult GPUFuncOpConversion::matchAndRewrite( gpu::GPUFuncOp funcOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const { if (!gpu::GPUDialect::isKernel(funcOp)) return failure(); SmallVector argABI; for (auto argIndex : llvm::seq(0, funcOp.getNumArguments())) { // If the ABI is already specified, use it. auto abiAttr = funcOp.getArgAttrOfType( argIndex, spirv::getInterfaceVarABIAttrName()); if (abiAttr) { argABI.push_back(abiAttr); continue; } // todo(ravishankarm): Use the "default ABI". Remove this in a follow up // CL. Staging this to make this easy to revert in case of breakages out of // tree. Optional sc; if (funcOp.getArgument(argIndex).getType().isIntOrIndexOrFloat()) sc = spirv::StorageClass::StorageBuffer; argABI.push_back( spirv::getInterfaceVarABIAttr(0, argIndex, sc, rewriter.getContext())); } auto entryPointAttr = spirv::lookupEntryPointABI(funcOp); if (!entryPointAttr) { funcOp.emitRemark("match failure: missing 'spv.entry_point_abi' attribute"); return failure(); } spirv::FuncOp newFuncOp = lowerAsEntryFunction( funcOp, typeConverter, rewriter, entryPointAttr, argABI); if (!newFuncOp) return failure(); newFuncOp.removeAttr(Identifier::get(gpu::GPUDialect::getKernelFuncAttrName(), rewriter.getContext())); return success(); } //===----------------------------------------------------------------------===// // ModuleOp with gpu.module. //===----------------------------------------------------------------------===// LogicalResult GPUModuleConversion::matchAndRewrite( gpu::GPUModuleOp moduleOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const { auto spvModule = rewriter.create( moduleOp.getLoc(), spirv::AddressingModel::Logical, spirv::MemoryModel::GLSL450); // Move the region from the module op into the SPIR-V module. Region &spvModuleRegion = spvModule.body(); rewriter.inlineRegionBefore(moduleOp.body(), spvModuleRegion, spvModuleRegion.begin()); // The spv.module build method adds a block with a terminator. Remove that // block. The terminator of the module op in the remaining block will be // legalized later. spvModuleRegion.back().erase(); rewriter.eraseOp(moduleOp); return success(); } //===----------------------------------------------------------------------===// // GPU return inside kernel functions to SPIR-V return. //===----------------------------------------------------------------------===// LogicalResult GPUReturnOpConversion::matchAndRewrite( gpu::ReturnOp returnOp, ArrayRef operands, ConversionPatternRewriter &rewriter) const { if (!operands.empty()) return failure(); rewriter.replaceOpWithNewOp(returnOp); return success(); } //===----------------------------------------------------------------------===// // GPU To SPIRV Patterns. //===----------------------------------------------------------------------===// namespace { #include "GPUToSPIRV.cpp.inc" } void mlir::populateGPUToSPIRVPatterns(MLIRContext *context, SPIRVTypeConverter &typeConverter, OwningRewritePatternList &patterns) { populateWithGenerated(context, &patterns); patterns.insert< ForOpConversion, GPUFuncOpConversion, GPUModuleConversion, GPUReturnOpConversion, IfOpConversion, LaunchConfigConversion, LaunchConfigConversion, LaunchConfigConversion, TerminatorOpConversion, WorkGroupSizeConversion>(context, typeConverter); }