doxygen/WmmaOpsToSPIRV_8cpp_source.html

 //===------ WmmaOpsToSPIRV.cpp - WMMA LD/ST/Compute to SPIRV lowering -----===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This file contains definitions of patterns to lower GPU Subgroup MMA ops to

 // SPIRV Cooperative Matrix ops.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Conversion/GPUToSPIRV/GPUToSPIRV.h"

 #include "mlir/Conversion/GPUToSPIRV/GPUToSPIRVPass.h"

 #include "mlir/Dialect/GPU/IR/GPUDialect.h"

 #include "mlir/Dialect/SPIRV/IR/SPIRVAttributes.h"

 #include "mlir/Dialect/SPIRV/IR/SPIRVDialect.h"

 #include "mlir/Dialect/SPIRV/IR/SPIRVEnums.h"

 #include "mlir/Dialect/SPIRV/IR/SPIRVOps.h"

 #include "mlir/Dialect/SPIRV/IR/SPIRVTypes.h"

 #include "mlir/Dialect/SPIRV/IR/TargetAndABI.h"

 #include "mlir/Dialect/SPIRV/Transforms/SPIRVConversion.h"

 #include "mlir/IR/BuiltinAttributes.h"

 #include "mlir/IR/BuiltinTypes.h"

 #include "mlir/IR/TypeUtilities.h"

 #include "mlir/IR/ValueRange.h"

 #include "llvm/ADT/STLExtras.h"

 #include "llvm/ADT/StringSwitch.h"


 #include <cassert>


 namespace mlir {

 //===----------------------------------------------------------------------===//

 // Patterns and helpers.

 //===----------------------------------------------------------------------===//


 /// Creates a SPIR-V op to replace the given GPU subgroup mma elementwise op

 /// when the elementwise op directly supports with cooperative matrix type.

 /// Returns false if cannot.

 ///

 /// See SPV_KHR_cooperative_matrix for supported elementwise ops.

 static bool createElementwiseOp(ConversionPatternRewriter &builder,

                                 gpu::SubgroupMmaElementwiseOp op, Type coopType,

                                 ValueRange operands) {

   assert((isa<spirv::CooperativeMatrixType>(coopType)));


   switch (op.getOpType()) {

   case gpu::MMAElementwiseOp::ADDF:

     builder.replaceOpWithNewOp<spirv::FAddOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::ADDI:

     builder.replaceOpWithNewOp<spirv::IAddOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::SUBF:

     builder.replaceOpWithNewOp<spirv::FSubOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::SUBI:

     builder.replaceOpWithNewOp<spirv::ISubOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::DIVF:

     builder.replaceOpWithNewOp<spirv::FDivOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::DIVS:

     builder.replaceOpWithNewOp<spirv::SDivOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::DIVU:

     builder.replaceOpWithNewOp<spirv::UDivOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::NEGATEF:

     builder.replaceOpWithNewOp<spirv::FNegateOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::NEGATES:

     builder.replaceOpWithNewOp<spirv::SNegateOp>(op, coopType, operands);

     return true;

   case gpu::MMAElementwiseOp::EXTF:

     builder.replaceOpWithNewOp<spirv::FConvertOp>(op, coopType, operands);

     return true;

   default:

     break;

   }

   return false;

 }


 /// Returns true iff every value in `operands` has the same type and that type
 /// is a `spirv::CooperativeMatrixType`. `operands` must not be empty.
 bool allOperandsHaveSameCoopMatrixType(ValueRange operands) {
   assert(!operands.empty());

   // The first operand's type is the reference every other operand must match.
   Type referenceType = operands.front().getType();
   if (!isa<spirv::CooperativeMatrixType>(referenceType))
     return false;

   return llvm::all_of(operands, [referenceType](Value operand) {
     return operand.getType() == referenceType;
   });
 }


 namespace {

 /// Lowers `gpu::SubgroupMmaConstantMatrixOp` to a
 /// `spirv::CompositeConstructOp` that produces the converted cooperative
 /// matrix type from the op's single (already converted) operand.
 struct WmmaConstantOpToSPIRVLowering final
     : OpConversionPattern<gpu::SubgroupMmaConstantMatrixOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaConstantMatrixOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     ValueRange convertedOperands = adaptor.getOperands();
     assert(convertedOperands.size() == 1);

     // Map the op's result type through the type converter.
     Type resultType = getTypeConverter()->convertType(op.getType());
     if (!resultType)
       return rewriter.notifyMatchFailure(op, "type conversion failed");

     Value constituent = convertedOperands.front();
     rewriter.replaceOpWithNewOp<spirv::CompositeConstructOp>(op, resultType,
                                                              constituent);
     return success();
   }
 };


 /// Default lowering of `gpu::SubgroupMmaElementwiseOp`: when all converted
 /// operands share one cooperative matrix type, delegates to
 /// `createElementwiseOp` to emit the matching SPIR-V elementwise op.
 struct WmmaElementwiseOpToSPIRVDefaultLowering final
     : OpConversionPattern<gpu::SubgroupMmaElementwiseOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaElementwiseOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     ValueRange convertedOperands = adaptor.getOperands();

     // Bail out unless every converted operand is the same coop matrix type.
     if (!allOperandsHaveSameCoopMatrixType(convertedOperands))
       return rewriter.notifyMatchFailure(op,
                                          "not all operands are coop matrices");

     Type resultType = getTypeConverter()->convertType(op.getType());
     if (!resultType)
       return rewriter.notifyMatchFailure(op, "type conversion failed");

     // The helper reports whether it actually replaced `op`; that decides
     // whether this pattern succeeded.
     const bool replaced =
         createElementwiseOp(rewriter, op, resultType, convertedOperands);
     return success(replaced);
   }
 };


 /// Lowers a MULF `gpu::SubgroupMmaElementwiseOp` with two operands, one of
 /// which is produced by a `gpu::SubgroupMmaConstantMatrixOp`, to
 /// `spirv::MatrixTimesScalarOp`.
 ///
 /// The scalar is recovered from the `spirv::CompositeConstructOp` that the
 /// constant matrix op was converted to. Every rejection path reports its
 /// reason through `notifyMatchFailure`.
 struct WmmaElementwiseOpToSPIRVScalarMulLowering final
     : OpConversionPattern<gpu::SubgroupMmaElementwiseOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaElementwiseOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     if (adaptor.getOperands().size() != 2)
       return rewriter.notifyMatchFailure(op, "expected exactly two operands");

     // All operands should be of cooperative matrix types.
     if (!allOperandsHaveSameCoopMatrixType(adaptor.getOperands())) {
       return rewriter.notifyMatchFailure(op,
                                          "not all operands are coop matrices");
     }

     if (op.getOpType() != gpu::MMAElementwiseOp::MULF)
       return rewriter.notifyMatchFailure(op, "not a MULF elementwise op");

     // Use the original operands to check whether one of the operands is a splat
     // scalar value; the converted (adaptor) operands are what gets used in the
     // rewrite.
     Value lhs = op.getOperands().front();
     Value rhs = op.getOperands().back();
     Value splat = nullptr;
     Value matrix = nullptr;
     if (lhs.getDefiningOp<gpu::SubgroupMmaConstantMatrixOp>()) {
       splat = adaptor.getOperands().front();
       matrix = adaptor.getOperands().back();
     } else if (rhs.getDefiningOp<gpu::SubgroupMmaConstantMatrixOp>()) {
       matrix = adaptor.getOperands().front();
       splat = adaptor.getOperands().back();
     }
     if (!splat || !matrix)
       return rewriter.notifyMatchFailure(op, "no splat operand");

     // Constant MMA matrix ops are converted to `spirv.CompositeConstruct` ops.
     auto cc = splat.getDefiningOp<spirv::CompositeConstructOp>();
     if (!cc) {
       return rewriter.notifyMatchFailure(op,
                                          "splat is not a composite construct");
     }

     // The composite construct is expected to carry the scalar as its only
     // constituent.
     assert(cc.getConstituents().size() == 1);
     Value scalar = cc.getConstituents().front();

     auto coopType = getTypeConverter()->convertType(op.getType());
     if (!coopType)
       return rewriter.notifyMatchFailure(op, "type conversion failed");
     rewriter.replaceOpWithNewOp<spirv::MatrixTimesScalarOp>(
         op, coopType, ValueRange{matrix, scalar});
     return success();
   }
 };

 } // namespace


 //===----------------------------------------------------------------------===//

 // SPV_KHR_cooperative_matrix

 //===----------------------------------------------------------------------===//


 namespace khr {

 namespace {


 /// Converts the GPU MMA loadOp to KHRCooperativeMatrixLoad op in the SPIRV
 /// dialect.
 ///
 /// The pattern fails to match when the result type cannot be converted to a
 /// cooperative matrix type or when no element pointer can be computed for the
 /// source memref and indices.
 struct WmmaLoadOpToSPIRVLowering final
     : OpConversionPattern<gpu::SubgroupMmaLoadMatrixOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaLoadMatrixOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     const auto &typeConverter = *getTypeConverter<SPIRVTypeConverter>();
     Location loc = op->getLoc();

     // Convert the result type first so that no IR is created when the type
     // cannot be converted.
     auto retType = cast<gpu::MMAMatrixType>(op.getRes().getType());
     auto coopType =
         typeConverter.convertType<spirv::CooperativeMatrixType>(retType);
     if (!coopType)
       return rewriter.notifyMatchFailure(op, "type conversion failed");

     MemRefType memrefType = op.getSrcMemref().getType();
     Value bufferPtr =
         spirv::getElementPtr(typeConverter, memrefType, adaptor.getSrcMemref(),
                              adaptor.getIndices(), loc, rewriter);
     // `getElementPtr` may return a null value when the index computation
     // cannot be performed; do not feed that into the load op.
     if (!bufferPtr)
       return rewriter.notifyMatchFailure(op,
                                          "failed to compute element pointer");

     // The leading dimension becomes the i32 stride operand of the load.
     int64_t stride = op.getLeadDimension().getSExtValue();
     IntegerType i32Type = rewriter.getI32Type();
     auto strideValue = rewriter.create<spirv::ConstantOp>(
         loc, i32Type, IntegerAttr::get(i32Type, stride));

     // A set `transpose` attribute selects column-major layout; otherwise the
     // load is row-major.
     bool isColMajor = op.getTranspose().value_or(false);
     auto layout = isColMajor ? spirv::CooperativeMatrixLayoutKHR::ColumnMajor
                              : spirv::CooperativeMatrixLayoutKHR::RowMajor;

     rewriter.replaceOpWithNewOp<spirv::KHRCooperativeMatrixLoadOp>(
         op, coopType, bufferPtr, strideValue, layout);
     return success();
   }
 };


 /// Converts the GPU MMA StoreOp to KHRCooperativeMatrixStore op in the SPIRV
 /// dialect.
 ///
 /// The pattern fails to match when no element pointer can be computed for the
 /// destination memref and indices.
 struct WmmaStoreOpToSPIRVLowering final
     : OpConversionPattern<gpu::SubgroupMmaStoreMatrixOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaStoreMatrixOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     const auto &typeConverter = *getTypeConverter<SPIRVTypeConverter>();
     Location loc = op->getLoc();

     auto memrefType = cast<MemRefType>(op.getDstMemref().getType());
     Value bufferPtr =
         spirv::getElementPtr(typeConverter, memrefType, adaptor.getDstMemref(),
                              adaptor.getIndices(), loc, rewriter);
     // `getElementPtr` may return a null value when the index computation
     // cannot be performed; do not feed that into the store op.
     if (!bufferPtr)
       return rewriter.notifyMatchFailure(op,
                                          "failed to compute element pointer");

     // The leading dimension becomes the i32 stride operand of the store.
     int64_t stride = op.getLeadDimension().getSExtValue();
     IntegerType i32Type = rewriter.getI32Type();
     auto strideValue = rewriter.create<spirv::ConstantOp>(
         loc, i32Type, IntegerAttr::get(i32Type, stride));

     // A set `transpose` attribute selects column-major layout; otherwise the
     // store is row-major.
     bool isColMajor = op.getTranspose().value_or(false);
     auto layout = isColMajor ? spirv::CooperativeMatrixLayoutKHR::ColumnMajor
                              : spirv::CooperativeMatrixLayoutKHR::RowMajor;

     rewriter.replaceOpWithNewOp<spirv::KHRCooperativeMatrixStoreOp>(
         op, bufferPtr, adaptor.getSrc(), strideValue, layout);
     return success();
   }
 };


 /// Lowers `gpu::SubgroupMmaComputeOp` to
 /// `spirv::KHRCooperativeMatrixMulAddOp`, forwarding the three converted
 /// operands (A, B and C) unchanged.
 struct WmmaMmaOpToSPIRVLowering final
     : OpConversionPattern<gpu::SubgroupMmaComputeOp> {
   using OpConversionPattern::OpConversionPattern;

   LogicalResult
   matchAndRewrite(gpu::SubgroupMmaComputeOp subgroupMmaComputeOp,
                   OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
     // Operands as seen after type conversion.
     Value matrixA = adaptor.getOpA();
     Value matrixB = adaptor.getOpB();
     Value matrixC = adaptor.getOpC();

     rewriter.replaceOpWithNewOp<spirv::KHRCooperativeMatrixMulAddOp>(
         subgroupMmaComputeOp, matrixA, matrixB, matrixC);
     return success();
   }
 };


 } // namespace

 } // namespace khr

 } // namespace mlir


 /// Adds the GPU subgroup MMA to SPIR-V KHR cooperative matrix lowering
 /// patterns defined in this file to `patterns`, each constructed with
 /// `converter` and the pattern set's context.
 void mlir::populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns(
     SPIRVTypeConverter &converter, RewritePatternSet &patterns) {
   using namespace mlir;
   MLIRContext *ctx = patterns.getContext();

   // Patterns registered with the default benefit.
   patterns.add<khr::WmmaLoadOpToSPIRVLowering>(converter, ctx);
   patterns.add<khr::WmmaMmaOpToSPIRVLowering>(converter, ctx);
   patterns.add<khr::WmmaStoreOpToSPIRVLowering>(converter, ctx);
   patterns.add<WmmaConstantOpToSPIRVLowering>(converter, ctx);
   patterns.add<WmmaElementwiseOpToSPIRVDefaultLowering>(converter, ctx);

   // The scalar-multiplication pattern gets a higher benefit so that it
   // prevails over the default elementwise pattern.
   patterns.add<WmmaElementwiseOpToSPIRVScalarMulLowering>(converter, ctx,
                                                           /*benefit=*/2);
 }


 /// Registers on `typeConverter` a conversion from `gpu::MMAMatrixType` to
 /// `spirv::CooperativeMatrixType` with subgroup scope. The element type and
 /// the first two shape dimensions are carried over, and the matrix use is
 /// derived from the MMA operand tag.
 void mlir::populateMMAToSPIRVCoopMatrixTypeConversion(
     mlir::SPIRVTypeConverter &typeConverter) {
   typeConverter.addConversion([](gpu::MMAMatrixType type) {
     // "AOp" and "BOp" select the A and B uses; any other tag falls back to
     // the accumulator use.
     auto matrixUse = spirv::CooperativeMatrixUseKHR::MatrixAcc;
     const auto operandTag = type.getOperand();
     if (operandTag == "AOp")
       matrixUse = spirv::CooperativeMatrixUseKHR::MatrixA;
     else if (operandTag == "BOp")
       matrixUse = spirv::CooperativeMatrixUseKHR::MatrixB;

     ArrayRef<int64_t> shape = type.getShape();
     return spirv::CooperativeMatrixType::get(type.getElementType(), shape[0],
                                              shape[1], spirv::Scope::Subgroup,
                                              matrixUse);
   });
 }

GPUDialect.h

GPUToSPIRVPass.h

GPUToSPIRV.h

SUBI
#define SUBI(lhs, rhs)
Definition: LoopEmitter.cpp:37

ADDI
#define ADDI(lhs, rhs)
Definition: LoopEmitter.cpp:35

SPIRVAttributes.h

SPIRVConversion.h

SPIRVDialect.h

SPIRVEnums.h

SPIRVOps.h

SPIRVTypes.h

TargetAndABI.h

TypeUtilities.h

ValueRange.h

llvm::ArrayRef
Definition: LLVM.h:45

llvm::StringSwitch
Definition: LLVM.h:75

mlir::Builder::getI32Type
IntegerType getI32Type()
Definition: Builders.cpp:83

mlir::ConversionPatternRewriter
This class implements a pattern rewriter for use with ConversionPatterns.
Definition: DialectConversion.h:660

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:63

mlir::MLIRContext
MLIRContext is the top-level object for a collection of MLIR operations.
Definition: MLIRContext.h:60

mlir::OpBuilder::create
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
Definition: Builders.cpp:464

mlir::OpConversionPattern
OpConversionPattern is a wrapper around ConversionPattern that allows for matching and rewriting agai...
Definition: DialectConversion.h:514

mlir::OpConversionPattern::OpConversionPattern
OpConversionPattern(MLIRContext *context, PatternBenefit benefit=1)
Definition: DialectConversion.h:518

mlir::RewritePatternSet
Definition: PatternMatch.h:807

mlir::RewritePatternSet::getContext
MLIRContext * getContext() const
Definition: PatternMatch.h:822

mlir::RewritePatternSet::add
RewritePatternSet & add(ConstructorArg &&arg, ConstructorArgs &&...args)
Add an instance of each of the pattern types 'Ts' to the pattern list with the given arguments.
Definition: PatternMatch.h:846

mlir::RewriterBase::notifyMatchFailure
std::enable_if_t<!std::is_convertible< CallbackT, Twine >::value, LogicalResult > notifyMatchFailure(Location loc, CallbackT &&reasonCallback)
Used to notify the listener that the IR failed to be rewritten because of a match failure,...
Definition: PatternMatch.h:718

mlir::RewriterBase::replaceOpWithNewOp
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Definition: PatternMatch.h:536

mlir::SPIRVTypeConverter
Type conversion from builtin types to SPIR-V types for shader interface.
Definition: SPIRVConversion.h:67

mlir::TypeConverter::addConversion
void addConversion(FnT &&callback)
Register a conversion function.
Definition: DialectConversion.h:167

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition: Types.h:74

mlir::ValueRange
This class provides an abstraction over the different types of ranges over Values.
Definition: ValueRange.h:381

mlir::ValueRange::getType
type_range getType() const

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:129

mlir::gpu::MMAMatrixType
MMAMatrix represents a matrix held by a subgroup for matrix-matrix multiply accumulate operations.
Definition: GPUDialect.h:130

mlir::gpu::MMAMatrixType::getShape
ArrayRef< int64_t > getShape() const
Get shape of the matrix.
Definition: GPUDialect.cpp:137

mlir::gpu::MMAMatrixType::getElementType
Type getElementType() const
Get elementType of a single element.
Definition: GPUDialect.cpp:141

mlir::gpu::MMAMatrixType::getOperand
StringRef getOperand() const
The general form of operation this type supports is given by the equation C += A*B.
Definition: GPUDialect.cpp:143

mlir::spirv::CooperativeMatrixType
Definition: SPIRVTypes.h:397

BuiltinAttributes.h

BuiltinTypes.h

mlir::lsp::CompletionItemKind::Value
@ Value

mlir::spirv::getElementPtr
Value getElementPtr(const SPIRVTypeConverter &typeConverter, MemRefType baseType, Value basePtr, ValueRange indices, Location loc, OpBuilder &builder)
Performs the index computation to get to the element at indices of the memory pointed to by basePtr,...
Definition: SPIRVConversion.cpp:1074

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::failure
LogicalResult failure(bool isFailure=true)
Utility function to generate a LogicalResult.
Definition: LogicalResult.h:62

mlir::populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns
void populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns(SPIRVTypeConverter &typeConverter, RewritePatternSet &patterns)
Collect a set of patterns to convert WMMA ops from GPU dialect to SPIRV, using the KHR Cooperative Ma...
Definition: WmmaOpsToSPIRV.cpp:295

mlir::success
LogicalResult success(bool isSuccess=true)
Utility function to generate a LogicalResult.
Definition: LogicalResult.h:56

mlir::createElementwiseOp
static bool createElementwiseOp(ConversionPatternRewriter &builder, gpu::SubgroupMmaElementwiseOp op, Type coopType, ValueRange operands)
Creates a SPIR-V op to replace the given GPU subgroup mma elementwise op when the elementwise op dire...
Definition: WmmaOpsToSPIRV.cpp:43

mlir::allOperandsHaveSameCoopMatrixType
bool allOperandsHaveSameCoopMatrixType(ValueRange operands)
Definition: WmmaOpsToSPIRV.cpp:85

mlir::populateMMAToSPIRVCoopMatrixTypeConversion
void populateMMAToSPIRVCoopMatrixTypeConversion(SPIRVTypeConverter &typeConverter)
Adds MMAMatrixType conversions to SPIR-V cooperative matrix KHR type conversion to the type converter...
Definition: WmmaOpsToSPIRV.cpp:307

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:510

mlir::LogicalResult
This class represents an efficient way to signal success or failure.
Definition: LogicalResult.h:26