MLIR 23.0.0git
ConvertVectorToLLVM.cpp
Go to the documentation of this file.
1//===- VectorToLLVM.cpp - Conversion from Vector to the LLVM dialect ------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
10
31#include "llvm/ADT/APFloat.h"
32#include "llvm/IR/LLVMContext.h"
33#include "llvm/Support/Casting.h"
34
35#include <optional>
36
37using namespace mlir;
38using namespace mlir::vector;
39
40// Helper that picks the proper sequence for inserting.
41static Value insertOne(ConversionPatternRewriter &rewriter,
42 const LLVMTypeConverter &typeConverter, Location loc,
43 Value val1, Value val2, Type llvmType, int64_t rank,
44 int64_t pos) {
45 assert(rank > 0 && "0-D vector corner case should have been handled already");
46 if (rank == 1) {
47 auto idxType = rewriter.getIndexType();
48 auto constant = LLVM::ConstantOp::create(
49 rewriter, loc, typeConverter.convertType(idxType),
50 rewriter.getIntegerAttr(idxType, pos));
51 return LLVM::InsertElementOp::create(rewriter, loc, llvmType, val1, val2,
52 constant);
53 }
54 return LLVM::InsertValueOp::create(rewriter, loc, val1, val2, pos);
55}
56
57// Helper that picks the proper sequence for extracting.
58static Value extractOne(ConversionPatternRewriter &rewriter,
59 const LLVMTypeConverter &typeConverter, Location loc,
60 Value val, Type llvmType, int64_t rank, int64_t pos) {
61 if (rank <= 1) {
62 auto idxType = rewriter.getIndexType();
63 auto constant = LLVM::ConstantOp::create(
64 rewriter, loc, typeConverter.convertType(idxType),
65 rewriter.getIntegerAttr(idxType, pos));
66 return LLVM::ExtractElementOp::create(rewriter, loc, llvmType, val,
67 constant);
68 }
69 return LLVM::ExtractValueOp::create(rewriter, loc, val, pos);
70}
71
// Helper that returns data layout alignment of a vector.
//
// Converts `vectorType` through `typeConverter` and writes the preferred
// alignment of the converted type (per the converter's data layout) into
// `align`. Fails if the vector type cannot be converted to an LLVM type.
LogicalResult getVectorAlignment(const LLVMTypeConverter &typeConverter,
                                 VectorType vectorType, unsigned &align) {
  Type convertedVectorTy = typeConverter.convertType(vectorType);
  if (!convertedVectorTy)
    return failure();

  // A throwaway LLVMContext suffices: it is only needed to translate the
  // MLIR type to an LLVM IR type for the data layout query.
  llvm::LLVMContext llvmContext;
  align = LLVM::TypeToLLVMIRTranslator(llvmContext)
              .getPreferredAlignment(convertedVectorTy,
                                     typeConverter.getDataLayout());

  return success();
}
86
// Helper that returns data layout alignment of a memref.
//
// Converts the memref's element type through `typeConverter` and writes its
// preferred alignment (per the converter's data layout) into `align`. Fails
// if the element type cannot be converted to an LLVM type.
LogicalResult getMemRefAlignment(const LLVMTypeConverter &typeConverter,
                                 MemRefType memrefType, unsigned &align) {
  Type elementTy = typeConverter.convertType(memrefType.getElementType());
  if (!elementTy)
    return failure();

  // TODO: this should use the MLIR data layout when it becomes available and
  // stop depending on translation.
  llvm::LLVMContext llvmContext;
  align = LLVM::TypeToLLVMIRTranslator(llvmContext)
              .getPreferredAlignment(elementTy, typeConverter.getDataLayout());
  return success();
}
101
102// Helper to resolve the alignment for vector load/store, gather and scatter
103// ops. If useVectorAlignment is true, get the preferred alignment for the
104// vector type in the operation. This option is used for hardware backends with
105// vectorization. Otherwise, use the preferred alignment of the element type of
106// the memref. Note that if you choose to use vector alignment, the shape of the
107// vector type must be resolved before the ConvertVectorToLLVM pass is run.
108LogicalResult getVectorToLLVMAlignment(const LLVMTypeConverter &typeConverter,
109 VectorType vectorType,
110 MemRefType memrefType, unsigned &align,
111 bool useVectorAlignment) {
112 if (useVectorAlignment) {
113 if (failed(getVectorAlignment(typeConverter, vectorType, align))) {
114 return failure();
115 }
116 } else {
117 if (failed(getMemRefAlignment(typeConverter, memrefType, align))) {
118 return failure();
119 }
120 }
121 return success();
122}
123
124// Check if the last stride is non-unit and has a valid memory space.
125static LogicalResult isMemRefTypeSupported(MemRefType memRefType,
126 const LLVMTypeConverter &converter) {
127 if (!memRefType.isLastDimUnitStride())
128 return failure();
129 if (failed(converter.getMemRefAddressSpace(memRefType)))
130 return failure();
131 return success();
132}
133
// Add an index vector component to a base pointer.
//
// Builds a vector-of-pointers GEP: each lane addresses `base + index[lane]`
// (scaled by the converted element type). `llvmMemref` is the converted
// memref descriptor, used only to recover the element pointer type; the
// result vector mirrors the (possibly scalable) 1-D shape of `vectorType`.
static Value getIndexedPtrs(ConversionPatternRewriter &rewriter, Location loc,
                            const LLVMTypeConverter &typeConverter,
                            MemRefType memRefType, Value llvmMemref, Value base,
                            Value index, VectorType vectorType) {
  assert(succeeded(isMemRefTypeSupported(memRefType, typeConverter)) &&
         "unsupported memref type");
  assert(vectorType.getRank() == 1 && "expected a 1-d vector type");
  auto pType = MemRefDescriptor(llvmMemref).getElementPtrType();
  auto ptrsType =
      LLVM::getVectorType(pType, vectorType.getDimSize(0),
                          /*isScalable=*/vectorType.getScalableDims()[0]);
  return LLVM::GEPOp::create(
      rewriter, loc, ptrsType,
      typeConverter.convertType(memRefType.getElementType()), base, index);
}
150
151/// Convert `foldResult` into a Value. Integer attribute is converted to
152/// an LLVM constant op.
154 OpFoldResult foldResult) {
155 if (auto attr = dyn_cast<Attribute>(foldResult)) {
156 auto intAttr = cast<IntegerAttr>(attr);
157 return LLVM::ConstantOp::create(builder, loc, intAttr).getResult();
158 }
159
160 return cast<Value>(foldResult);
161}
162
163namespace {
164
165/// Trivial Vector to LLVM conversions
166using VectorScaleOpConversion =
168
/// Conversion pattern for a vector.bitcast.
class VectorBitCastOpConversion
    : public ConvertOpToLLVMPattern<vector::BitCastOp> {
public:
  using ConvertOpToLLVMPattern<vector::BitCastOp>::ConvertOpToLLVMPattern;

  /// Rewrites vector.bitcast into llvm.bitcast on the converted operand.
  LogicalResult
  matchAndRewrite(vector::BitCastOp bitCastOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    // Only 0-D and 1-D vectors can be lowered to LLVM.
    VectorType resultTy = bitCastOp.getResultVectorType();
    if (resultTy.getRank() > 1)
      return failure();
    Type newResultTy = typeConverter->convertType(resultTy);
    rewriter.replaceOpWithNewOp<LLVM::BitcastOp>(bitCastOp, newResultTy,
                                                 adaptor.getOperands()[0]);
    return success();
  }
};
188
/// Overloaded utility that replaces a vector.load, vector.store,
/// vector.maskedload and vector.maskedstore with their respective LLVM
/// counterparts.
static void replaceLoadOrStoreOp(vector::LoadOp loadOp,
                                 vector::LoadOpAdaptor adaptor,
                                 VectorType vectorTy, Value ptr, unsigned align,
                                 ConversionPatternRewriter &rewriter) {
  // Plain load: never volatile, nontemporal hint forwarded from the op.
  rewriter.replaceOpWithNewOp<LLVM::LoadOp>(loadOp, vectorTy, ptr, align,
                                            /*volatile_=*/false,
                                            loadOp.getNontemporal());
}
200
/// Replaces a vector.maskedload with llvm.intr.masked.load, forwarding the
/// mask and pass-through operands from the adaptor.
static void replaceLoadOrStoreOp(vector::MaskedLoadOp loadOp,
                                 vector::MaskedLoadOpAdaptor adaptor,
                                 VectorType vectorTy, Value ptr, unsigned align,
                                 ConversionPatternRewriter &rewriter) {
  rewriter.replaceOpWithNewOp<LLVM::MaskedLoadOp>(
      loadOp, vectorTy, ptr, adaptor.getMask(), adaptor.getPassThru(), align);
}
208
/// Replaces a vector.store with llvm.store (never volatile, nontemporal hint
/// forwarded from the op). `vectorTy` is unused: the stored value fixes the
/// type.
static void replaceLoadOrStoreOp(vector::StoreOp storeOp,
                                 vector::StoreOpAdaptor adaptor,
                                 VectorType vectorTy, Value ptr, unsigned align,
                                 ConversionPatternRewriter &rewriter) {
  rewriter.replaceOpWithNewOp<LLVM::StoreOp>(storeOp, adaptor.getValueToStore(),
                                             ptr, align, /*volatile_=*/false,
                                             storeOp.getNontemporal());
}
217
/// Replaces a vector.maskedstore with llvm.intr.masked.store, forwarding the
/// value and mask from the adaptor.
static void replaceLoadOrStoreOp(vector::MaskedStoreOp storeOp,
                                 vector::MaskedStoreOpAdaptor adaptor,
                                 VectorType vectorTy, Value ptr, unsigned align,
                                 ConversionPatternRewriter &rewriter) {
  rewriter.replaceOpWithNewOp<LLVM::MaskedStoreOp>(
      storeOp, adaptor.getValueToStore(), ptr, adaptor.getMask(), align);
}
225
/// Conversion pattern for a vector.load, vector.store, vector.maskedload, and
/// vector.maskedstore.
///
/// Shared skeleton: resolve the alignment, compute the strided element
/// pointer, then dispatch to the replaceLoadOrStoreOp overload that matches
/// the concrete op.
template <class LoadOrStoreOp>
class VectorLoadStoreConversion : public ConvertOpToLLVMPattern<LoadOrStoreOp> {
public:
  explicit VectorLoadStoreConversion(const LLVMTypeConverter &typeConv,
                                     bool useVectorAlign)
      : ConvertOpToLLVMPattern<LoadOrStoreOp>(typeConv),
        useVectorAlignment(useVectorAlign) {}
  using ConvertOpToLLVMPattern<LoadOrStoreOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(LoadOrStoreOp loadOrStoreOp,
                  typename LoadOrStoreOp::Adaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    // Only 1-D vectors can be lowered to LLVM.
    VectorType vectorTy = loadOrStoreOp.getVectorType();
    if (vectorTy.getRank() > 1)
      return failure();

    auto loc = loadOrStoreOp->getLoc();
    MemRefType memRefTy = loadOrStoreOp.getMemRefType();

    // Resolve alignment.
    // Explicit alignment takes priority over use-vector-alignment.
    unsigned align = loadOrStoreOp.getAlignment().value_or(0);
    if (!align &&
        failed(getVectorToLLVMAlignment(*this->getTypeConverter(), vectorTy,
                                        memRefTy, align, useVectorAlignment)))
      return rewriter.notifyMatchFailure(loadOrStoreOp,
                                         "could not resolve alignment");

    // Resolve address of the accessed element from the base + indices.
    auto vtype = cast<VectorType>(
        this->typeConverter->convertType(loadOrStoreOp.getVectorType()));
    Value dataPtr = this->getStridedElementPtr(
        rewriter, loc, memRefTy, adaptor.getBase(), adaptor.getIndices());
    // Overload resolution picks the LLVM counterpart for this op kind.
    replaceLoadOrStoreOp(loadOrStoreOp, adaptor, vtype, dataPtr, align,
                         rewriter);
    return success();
  }

private:
  // If true, use the preferred alignment of the vector type.
  // If false, use the preferred alignment of the element type
  // of the memref. This flag is intended for use with hardware
  // backends that require alignment of vector operations.
  const bool useVectorAlignment;
};
275
/// Conversion pattern for a vector.gather.
///
/// Lowers a 1-D gather from a contiguous memref to llvm.intr.masked.gather:
/// the scalar base pointer is widened into a vector of per-lane pointers via
/// the index vector, and mask/pass-through are forwarded.
class VectorGatherOpConversion
    : public ConvertOpToLLVMPattern<vector::GatherOp> {
public:
  explicit VectorGatherOpConversion(const LLVMTypeConverter &typeConv,
                                    bool useVectorAlign)
      : ConvertOpToLLVMPattern<vector::GatherOp>(typeConv),
        useVectorAlignment(useVectorAlign) {}
  using ConvertOpToLLVMPattern<vector::GatherOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::GatherOp gather, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    Location loc = gather->getLoc();
    MemRefType memRefType = dyn_cast<MemRefType>(gather.getBaseType());
    assert(memRefType && "The base should be bufferized");

    // TODO: Add support for strided MemRef.
    if (failed(isMemRefTypeSupported(memRefType, *this->getTypeConverter())))
      return rewriter.notifyMatchFailure(gather, "memref type not supported");

    VectorType vType = gather.getVectorType();
    if (vType.getRank() > 1) {
      return rewriter.notifyMatchFailure(
          gather, "only 1-D vectors can be lowered to LLVM");
    }

    // Resolve alignment.
    // Explicit alignment takes priority over use-vector-alignment.
    unsigned align = gather.getAlignment().value_or(0);
    if (!align &&
        failed(getVectorToLLVMAlignment(*this->getTypeConverter(), vType,
                                        memRefType, align, useVectorAlignment)))
      return rewriter.notifyMatchFailure(gather, "could not resolve alignment");

    // Resolve address: scalar pointer at base + offsets, then one pointer
    // per lane from the index vector.
    Value ptr = getStridedElementPtr(rewriter, loc, memRefType,
                                     adaptor.getBase(), adaptor.getOffsets());
    Value base = adaptor.getBase();
    Value ptrs =
        getIndexedPtrs(rewriter, loc, *this->getTypeConverter(), memRefType,
                       base, ptr, adaptor.getIndices(), vType);

    // Replace with the gather intrinsic.
    rewriter.replaceOpWithNewOp<LLVM::masked_gather>(
        gather, typeConverter->convertType(vType), ptrs, adaptor.getMask(),
        adaptor.getPassThru(), rewriter.getI32IntegerAttr(align));
    return success();
  }

private:
  // If true, use the preferred alignment of the vector type.
  // If false, use the preferred alignment of the element type
  // of the memref. This flag is intended for use with hardware
  // backends that require alignment of vector operations.
  const bool useVectorAlignment;
};
333
/// Conversion pattern for a vector.scatter.
///
/// Mirrors VectorGatherOpConversion: lowers a 1-D scatter into
/// llvm.intr.masked.scatter through a vector of per-lane pointers.
class VectorScatterOpConversion
    : public ConvertOpToLLVMPattern<vector::ScatterOp> {
public:
  explicit VectorScatterOpConversion(const LLVMTypeConverter &typeConv,
                                     bool useVectorAlign)
      : ConvertOpToLLVMPattern<vector::ScatterOp>(typeConv),
        useVectorAlignment(useVectorAlign) {}

  using ConvertOpToLLVMPattern<vector::ScatterOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::ScatterOp scatter, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = scatter->getLoc();
    auto memRefType = dyn_cast<MemRefType>(scatter.getBaseType());
    assert(memRefType && "The base should be bufferized");

    // TODO: Add support for strided MemRef.
    if (failed(isMemRefTypeSupported(memRefType, *this->getTypeConverter())))
      return rewriter.notifyMatchFailure(scatter, "memref type not supported");

    VectorType vType = scatter.getVectorType();
    if (vType.getRank() > 1) {
      return rewriter.notifyMatchFailure(
          scatter, "only 1-D vectors can be lowered to LLVM");
    }

    // Resolve alignment.
    // Explicit alignment takes priority over use-vector-alignment.
    unsigned align = scatter.getAlignment().value_or(0);
    if (!align &&
        failed(getVectorToLLVMAlignment(*this->getTypeConverter(), vType,
                                        memRefType, align, useVectorAlignment)))
      return rewriter.notifyMatchFailure(scatter,
                                         "could not resolve alignment");

    // Resolve address: scalar pointer at base + offsets, then one pointer
    // per lane from the index vector.
    Value ptr = getStridedElementPtr(rewriter, loc, memRefType,
                                     adaptor.getBase(), adaptor.getOffsets());
    Value ptrs =
        getIndexedPtrs(rewriter, loc, *this->getTypeConverter(), memRefType,
                       adaptor.getBase(), ptr, adaptor.getIndices(), vType);

    // Replace with the scatter intrinsic.
    rewriter.replaceOpWithNewOp<LLVM::masked_scatter>(
        scatter, adaptor.getValueToStore(), ptrs, adaptor.getMask(),
        rewriter.getI32IntegerAttr(align));
    return success();
  }

private:
  // If true, use the preferred alignment of the vector type.
  // If false, use the preferred alignment of the element type
  // of the memref. This flag is intended for use with hardware
  // backends that require alignment of vector operations.
  const bool useVectorAlignment;
};
392
/// Conversion pattern for a vector.expandload.
///
/// Lowers to llvm.intr.masked.expandload at the strided element address,
/// forwarding mask and pass-through.
class VectorExpandLoadOpConversion
    : public ConvertOpToLLVMPattern<vector::ExpandLoadOp> {
public:
  using ConvertOpToLLVMPattern<vector::ExpandLoadOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::ExpandLoadOp expand, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = expand->getLoc();
    MemRefType memRefType = expand.getMemRefType();

    // Resolve address.
    auto vtype = typeConverter->convertType(expand.getVectorType());
    Value ptr = getStridedElementPtr(rewriter, loc, memRefType,
                                     adaptor.getBase(), adaptor.getIndices());

    // From:
    // https://llvm.org/docs/LangRef.html#llvm-masked-expandload-intrinsics
    // The pointer alignment defaults to 1.
    uint64_t alignment = expand.getAlignment().value_or(1);

    rewriter.replaceOpWithNewOp<LLVM::masked_expandload>(
        expand, vtype, ptr, adaptor.getMask(), adaptor.getPassThru(),
        alignment);
    return success();
  }
};
421
/// Conversion pattern for a vector.compressstore.
///
/// Lowers to llvm.intr.masked.compressstore at the strided element address,
/// forwarding the value and mask.
class VectorCompressStoreOpConversion
    : public ConvertOpToLLVMPattern<vector::CompressStoreOp> {
public:
  using ConvertOpToLLVMPattern<vector::CompressStoreOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::CompressStoreOp compress, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = compress->getLoc();
    MemRefType memRefType = compress.getMemRefType();

    // Resolve address.
    Value ptr = getStridedElementPtr(rewriter, loc, memRefType,
                                     adaptor.getBase(), adaptor.getIndices());

    // From:
    // https://llvm.org/docs/LangRef.html#llvm-masked-compressstore-intrinsics
    // The pointer alignment defaults to 1.
    uint64_t alignment = compress.getAlignment().value_or(1);

    rewriter.replaceOpWithNewOp<LLVM::masked_compressstore>(
        compress, adaptor.getValueToStore(), ptr, adaptor.getMask(), alignment);
    return success();
  }
};
448
/// Reduction neutral classes for overloading.
/// Empty tag types that select, via overload resolution, which neutral
/// (identity) element `createReductionNeutralValue` materializes for a
/// given reduction kind.
class ReductionNeutralZero {};
class ReductionNeutralIntOne {};
class ReductionNeutralFPOne {};
class ReductionNeutralAllOnes {};
class ReductionNeutralSIntMin {};
class ReductionNeutralUIntMin {};
class ReductionNeutralSIntMax {};
class ReductionNeutralUIntMax {};
class ReductionNeutralFPMin {};
class ReductionNeutralFPMax {};
460
461/// Create the reduction neutral zero value.
462static Value createReductionNeutralValue(ReductionNeutralZero neutral,
463 ConversionPatternRewriter &rewriter,
464 Location loc, Type llvmType) {
465 return LLVM::ConstantOp::create(rewriter, loc, llvmType,
466 rewriter.getZeroAttr(llvmType));
467}
468
469/// Create the reduction neutral integer one value.
470static Value createReductionNeutralValue(ReductionNeutralIntOne neutral,
471 ConversionPatternRewriter &rewriter,
472 Location loc, Type llvmType) {
473 return LLVM::ConstantOp::create(rewriter, loc, llvmType,
474 rewriter.getIntegerAttr(llvmType, 1));
475}
476
477/// Create the reduction neutral fp one value.
478static Value createReductionNeutralValue(ReductionNeutralFPOne neutral,
479 ConversionPatternRewriter &rewriter,
480 Location loc, Type llvmType) {
481 return LLVM::ConstantOp::create(rewriter, loc, llvmType,
482 rewriter.getFloatAttr(llvmType, 1.0));
483}
484
485/// Create the reduction neutral all-ones value.
486static Value createReductionNeutralValue(ReductionNeutralAllOnes neutral,
487 ConversionPatternRewriter &rewriter,
488 Location loc, Type llvmType) {
489 return LLVM::ConstantOp::create(
490 rewriter, loc, llvmType,
491 rewriter.getIntegerAttr(
492 llvmType, llvm::APInt::getAllOnes(llvmType.getIntOrFloatBitWidth())));
493}
494
495/// Create the reduction neutral signed int minimum value.
496static Value createReductionNeutralValue(ReductionNeutralSIntMin neutral,
497 ConversionPatternRewriter &rewriter,
498 Location loc, Type llvmType) {
499 return LLVM::ConstantOp::create(
500 rewriter, loc, llvmType,
501 rewriter.getIntegerAttr(llvmType, llvm::APInt::getSignedMinValue(
502 llvmType.getIntOrFloatBitWidth())));
503}
504
505/// Create the reduction neutral unsigned int minimum value.
506static Value createReductionNeutralValue(ReductionNeutralUIntMin neutral,
507 ConversionPatternRewriter &rewriter,
508 Location loc, Type llvmType) {
509 return LLVM::ConstantOp::create(
510 rewriter, loc, llvmType,
511 rewriter.getIntegerAttr(llvmType, llvm::APInt::getMinValue(
512 llvmType.getIntOrFloatBitWidth())));
513}
514
515/// Create the reduction neutral signed int maximum value.
516static Value createReductionNeutralValue(ReductionNeutralSIntMax neutral,
517 ConversionPatternRewriter &rewriter,
518 Location loc, Type llvmType) {
519 return LLVM::ConstantOp::create(
520 rewriter, loc, llvmType,
521 rewriter.getIntegerAttr(llvmType, llvm::APInt::getSignedMaxValue(
522 llvmType.getIntOrFloatBitWidth())));
523}
524
525/// Create the reduction neutral unsigned int maximum value.
526static Value createReductionNeutralValue(ReductionNeutralUIntMax neutral,
527 ConversionPatternRewriter &rewriter,
528 Location loc, Type llvmType) {
529 return LLVM::ConstantOp::create(
530 rewriter, loc, llvmType,
531 rewriter.getIntegerAttr(llvmType, llvm::APInt::getMaxValue(
532 llvmType.getIntOrFloatBitWidth())));
533}
534
535/// Create the reduction neutral fp minimum value.
536static Value createReductionNeutralValue(ReductionNeutralFPMin neutral,
537 ConversionPatternRewriter &rewriter,
538 Location loc, Type llvmType) {
539 auto floatType = cast<FloatType>(llvmType);
540 return LLVM::ConstantOp::create(
541 rewriter, loc, llvmType,
542 rewriter.getFloatAttr(
543 llvmType, llvm::APFloat::getQNaN(floatType.getFloatSemantics(),
544 /*Negative=*/false)));
545}
546
547/// Create the reduction neutral fp maximum value.
548static Value createReductionNeutralValue(ReductionNeutralFPMax neutral,
549 ConversionPatternRewriter &rewriter,
550 Location loc, Type llvmType) {
551 auto floatType = cast<FloatType>(llvmType);
552 return LLVM::ConstantOp::create(
553 rewriter, loc, llvmType,
554 rewriter.getFloatAttr(
555 llvmType, llvm::APFloat::getQNaN(floatType.getFloatSemantics(),
556 /*Negative=*/true)));
557}
558
559/// Returns `accumulator` if it has a valid value. Otherwise, creates and
560/// returns a new accumulator value using `ReductionNeutral`.
561template <class ReductionNeutral>
562static Value getOrCreateAccumulator(ConversionPatternRewriter &rewriter,
563 Location loc, Type llvmType,
564 Value accumulator) {
565 if (accumulator)
566 return accumulator;
567
568 return createReductionNeutralValue(ReductionNeutral(), rewriter, loc,
569 llvmType);
570}
571
/// Creates a value with the 1-D vector shape provided in `llvmType`.
/// This is used as effective vector length by some intrinsics supporting
/// dynamic vector lengths at runtime.
static Value createVectorLengthValue(ConversionPatternRewriter &rewriter,
                                     Location loc, Type llvmType) {
  VectorType vType = cast<VectorType>(llvmType);
  auto vShape = vType.getShape();
  assert(vShape.size() == 1 && "Unexpected multi-dim vector type");

  // Static (base) length as an i32 constant.
  Value baseVecLength = LLVM::ConstantOp::create(
      rewriter, loc, rewriter.getI32Type(),
      rewriter.getIntegerAttr(rewriter.getI32Type(), vShape[0]));

  if (!vType.getScalableDims()[0])
    return baseVecLength;

  // For a scalable vector type, create and return `vScale * baseVecLength`.
  Value vScale = vector::VectorScaleOp::create(rewriter, loc);
  vScale =
      arith::IndexCastOp::create(rewriter, loc, rewriter.getI32Type(), vScale);
  Value scalableVecLength =
      arith::MulIOp::create(rewriter, loc, baseVecLength, vScale);
  return scalableVecLength;
}
596
/// Helper method to lower a `vector.reduction` op that performs an arithmetic
/// operation like add, mul, etc. `LLVMRedIntrinOp` is the LLVM vector
/// reduction intrinsic to use and `ScalarOp` is the scalar operation used to
/// fold in the accumulation value if non-null.
template <class LLVMRedIntrinOp, class ScalarOp>
static Value createIntegerReductionArithmeticOpLowering(
    ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
    Value vectorOperand, Value accumulator) {

  Value result =
      LLVMRedIntrinOp::create(rewriter, loc, llvmType, vectorOperand);

  // Combine with the optional accumulator using the matching scalar op.
  if (accumulator)
    result = ScalarOp::create(rewriter, loc, accumulator, result);
  return result;
}
613
/// Helper method to lower a `vector.reduction` operation that performs
/// a comparison operation like `min`/`max`. `LLVMRedIntrinOp` is the LLVM
/// vector reduction intrinsic to use and `predicate` is the predicate to use
/// to compare+combine the accumulator value if non-null.
template <class LLVMRedIntrinOp>
static Value createIntegerReductionComparisonOpLowering(
    ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
    Value vectorOperand, Value accumulator, LLVM::ICmpPredicate predicate) {
  Value result =
      LLVMRedIntrinOp::create(rewriter, loc, llvmType, vectorOperand);
  if (accumulator) {
    // Fold in the accumulator with an icmp + select pair.
    Value cmp =
        LLVM::ICmpOp::create(rewriter, loc, predicate, accumulator, result);
    result = LLVM::SelectOp::create(rewriter, loc, cmp, accumulator, result);
  }
  return result;
}
631
namespace {
/// Maps an LLVM FP vector reduction intrinsic to the scalar LLVM op used to
/// combine the reduction result with an accumulator value.
template <typename Source>
struct VectorToScalarMapper;
template <>
struct VectorToScalarMapper<LLVM::vector_reduce_fmaximum> {
  using Type = LLVM::MaximumOp;
};
template <>
struct VectorToScalarMapper<LLVM::vector_reduce_fminimum> {
  using Type = LLVM::MinimumOp;
};
template <>
struct VectorToScalarMapper<LLVM::vector_reduce_fmax> {
  using Type = LLVM::MaxNumOp;
};
template <>
struct VectorToScalarMapper<LLVM::vector_reduce_fmin> {
  using Type = LLVM::MinNumOp;
};
} // namespace
652
/// Lowers an FP min/max-style `vector.reduction` to the given LLVM vector
/// reduction intrinsic, combining an optional accumulator with the matching
/// scalar op (see VectorToScalarMapper). Fast-math flags are forwarded to
/// the intrinsic.
template <class LLVMRedIntrinOp>
static Value createFPReductionComparisonOpLowering(
    ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
    Value vectorOperand, Value accumulator, LLVM::FastmathFlagsAttr fmf) {
  Value result =
      LLVMRedIntrinOp::create(rewriter, loc, llvmType, vectorOperand, fmf);

  if (accumulator) {
    result = VectorToScalarMapper<LLVMRedIntrinOp>::Type::create(
        rewriter, loc, result, accumulator);
  }

  return result;
}
667
/// Mask neutral classes for overloading: tag types selecting which value is
/// substituted into masked-off lanes before an unmasked reduction.
class MaskNeutralFMaximum {};
class MaskNeutralFMinimum {};
671
672/// Get the mask neutral floating point maximum value
673static llvm::APFloat
674getMaskNeutralValue(MaskNeutralFMaximum,
675 const llvm::fltSemantics &floatSemantics) {
676 return llvm::APFloat::getSmallest(floatSemantics, /*Negative=*/true);
677}
/// Get the mask neutral floating point minimum value: the largest positive
/// finite value, which cannot win an fminimum reduction against any finite
/// active lane.
static llvm::APFloat
getMaskNeutralValue(MaskNeutralFMinimum,
                    const llvm::fltSemantics &floatSemantics) {
  return llvm::APFloat::getLargest(floatSemantics, /*Negative=*/false);
}
684
685/// Create the mask neutral floating point MLIR vector constant
686template <typename MaskNeutral>
687static Value createMaskNeutralValue(ConversionPatternRewriter &rewriter,
688 Location loc, Type llvmType,
689 Type vectorType) {
690 const auto &floatSemantics = cast<FloatType>(llvmType).getFloatSemantics();
691 auto value = getMaskNeutralValue(MaskNeutral{}, floatSemantics);
692 auto denseValue = DenseElementsAttr::get(cast<ShapedType>(vectorType), value);
693 return LLVM::ConstantOp::create(rewriter, loc, vectorType, denseValue);
694}
695
/// Lowers masked `fmaximum` and `fminimum` reductions using the non-masked
/// intrinsics. It is a workaround to overcome the lack of masked intrinsics
/// for `fmaximum`/`fminimum`.
/// More information: https://github.com/llvm/llvm-project/issues/64940
template <class LLVMRedIntrinOp, class MaskNeutral>
static Value
lowerMaskedReductionWithRegular(ConversionPatternRewriter &rewriter,
                                Location loc, Type llvmType,
                                Value vectorOperand, Value accumulator,
                                Value mask, LLVM::FastmathFlagsAttr fmf) {
  // Replace masked-off lanes with a value that cannot affect the reduction,
  // then run the regular (unmasked) lowering.
  const Value vectorMaskNeutral = createMaskNeutralValue<MaskNeutral>(
      rewriter, loc, llvmType, vectorOperand.getType());
  const Value selectedVectorByMask = LLVM::SelectOp::create(
      rewriter, loc, mask, vectorOperand, vectorMaskNeutral);
  return createFPReductionComparisonOpLowering<LLVMRedIntrinOp>(
      rewriter, loc, llvmType, selectedVectorByMask, accumulator, fmf);
}
713
/// Lowers an FP reduction to an LLVM intrinsic that takes an explicit start
/// value, defaulting the accumulator to the `ReductionNeutral` element when
/// none was provided.
template <class LLVMRedIntrinOp, class ReductionNeutral>
static Value
lowerReductionWithStartValue(ConversionPatternRewriter &rewriter, Location loc,
                             Type llvmType, Value vectorOperand,
                             Value accumulator, LLVM::FastmathFlagsAttr fmf) {
  accumulator = getOrCreateAccumulator<ReductionNeutral>(rewriter, loc,
                                                         llvmType, accumulator);
  return LLVMRedIntrinOp::create(rewriter, loc, llvmType,
                                 /*start_value=*/accumulator, vectorOperand,
                                 fmf);
}
725
/// Overloaded methods to lower a *predicated* reduction to an llvm intrinsic
/// that requires a start value. This start value format spans across fp
/// reductions without mask and all the masked reduction intrinsics.
template <class LLVMVPRedIntrinOp, class ReductionNeutral>
static Value
lowerPredicatedReductionWithStartValue(ConversionPatternRewriter &rewriter,
                                       Location loc, Type llvmType,
                                       Value vectorOperand, Value accumulator) {
  accumulator = getOrCreateAccumulator<ReductionNeutral>(rewriter, loc,
                                                         llvmType, accumulator);
  return LLVMVPRedIntrinOp::create(rewriter, loc, llvmType,
                                   /*startValue=*/accumulator, vectorOperand);
}
739
/// Masked variant: the VP intrinsic additionally takes the mask and an
/// effective vector length operand (see createVectorLengthValue).
template <class LLVMVPRedIntrinOp, class ReductionNeutral>
static Value lowerPredicatedReductionWithStartValue(
    ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
    Value vectorOperand, Value accumulator, Value mask) {
  accumulator = getOrCreateAccumulator<ReductionNeutral>(rewriter, loc,
                                                         llvmType, accumulator);
  Value vectorLength =
      createVectorLengthValue(rewriter, loc, vectorOperand.getType());
  return LLVMVPRedIntrinOp::create(rewriter, loc, llvmType,
                                   /*start_value=*/accumulator, vectorOperand,
                                   mask, vectorLength);
}
752
/// Dispatching variant: selects the integer or floating-point predicated
/// reduction lowering based on the reduction's element type.
template <class LLVMIntVPRedIntrinOp, class IntReductionNeutral,
          class LLVMFPVPRedIntrinOp, class FPReductionNeutral>
static Value lowerPredicatedReductionWithStartValue(
    ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
    Value vectorOperand, Value accumulator, Value mask) {
  // Integer dispatch.
  if (llvmType.isIntOrIndex())
    return lowerPredicatedReductionWithStartValue<LLVMIntVPRedIntrinOp,
                                                  IntReductionNeutral>(
        rewriter, loc, llvmType, vectorOperand, accumulator, mask);

  // FP dispatch.
  return lowerPredicatedReductionWithStartValue<LLVMFPVPRedIntrinOp,
                                                FPReductionNeutral>(
      rewriter, loc, llvmType, vectorOperand, accumulator, mask);
}
768
769/// Conversion pattern for all vector reductions.
770class VectorReductionOpConversion
771 : public ConvertOpToLLVMPattern<vector::ReductionOp> {
772public:
773 explicit VectorReductionOpConversion(const LLVMTypeConverter &typeConv,
774 bool reassociateFPRed)
775 : ConvertOpToLLVMPattern<vector::ReductionOp>(typeConv),
776 reassociateFPReductions(reassociateFPRed) {}
777
  /// Lowers `vector.reduction` to an LLVM vector-reduce intrinsic, folding in
  /// the optional accumulator operand where the intrinsic does not take one
  /// directly. Dispatches on the combining kind and on whether the scalar
  /// result type is an integer/index or a float.
  LogicalResult
  matchAndRewrite(vector::ReductionOp reductionOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto kind = reductionOp.getKind();
    // The scalar result (destination) type decides between the integer and
    // the floating-point lowering paths below.
    Type eltType = reductionOp.getDest().getType();
    Type llvmType = typeConverter->convertType(eltType);
    Value operand = adaptor.getVector();
    Value acc = adaptor.getAcc();
    Location loc = reductionOp.getLoc();

    if (eltType.isIntOrIndex()) {
      // Integer reductions: add/mul/min/max/and/or/xor.
      // Arithmetic kinds combine the accumulator with a scalar arith op;
      // min/max kinds combine it via the integer compare predicate passed to
      // the comparison lowering helper.
      Value result;
      switch (kind) {
      case vector::CombiningKind::ADD:
        result =
            createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_add,
                                                       LLVM::AddOp>(
                rewriter, loc, llvmType, operand, acc);
        break;
      case vector::CombiningKind::MUL:
        result =
            createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_mul,
                                                       LLVM::MulOp>(
                rewriter, loc, llvmType, operand, acc);
        break;
      case vector::CombiningKind::MINUI:
        result = createIntegerReductionComparisonOpLowering<
            LLVM::vector_reduce_umin>(rewriter, loc, llvmType, operand, acc,
                                      LLVM::ICmpPredicate::ule);
        break;
      case vector::CombiningKind::MINSI:
        result = createIntegerReductionComparisonOpLowering<
            LLVM::vector_reduce_smin>(rewriter, loc, llvmType, operand, acc,
                                      LLVM::ICmpPredicate::sle);
        break;
      case vector::CombiningKind::MAXUI:
        result = createIntegerReductionComparisonOpLowering<
            LLVM::vector_reduce_umax>(rewriter, loc, llvmType, operand, acc,
                                      LLVM::ICmpPredicate::uge);
        break;
      case vector::CombiningKind::MAXSI:
        result = createIntegerReductionComparisonOpLowering<
            LLVM::vector_reduce_smax>(rewriter, loc, llvmType, operand, acc,
                                      LLVM::ICmpPredicate::sge);
        break;
      case vector::CombiningKind::AND:
        result =
            createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_and,
                                                       LLVM::AndOp>(
                rewriter, loc, llvmType, operand, acc);
        break;
      case vector::CombiningKind::OR:
        result =
            createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_or,
                                                       LLVM::OrOp>(
                rewriter, loc, llvmType, operand, acc);
        break;
      case vector::CombiningKind::XOR:
        result =
            createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_xor,
                                                       LLVM::XOrOp>(
                rewriter, loc, llvmType, operand, acc);
        break;
      default:
        // Remaining kinds (the floating-point-only ones) are not valid with
        // an integer element type.
        return failure();
      }
      rewriter.replaceOp(reductionOp, result);

      return success();
    }

    if (!isa<FloatType>(eltType))
      return failure();

    // Translate the op's arith fast-math flags to their LLVM equivalents and,
    // when the pass was configured with `reassociateFPReductions`, also set
    // `reassoc` so the backend may reassociate the reduction.
    arith::FastMathFlagsAttr fMFAttr = reductionOp.getFastMathFlagsAttr();
    LLVM::FastmathFlagsAttr fmf = LLVM::FastmathFlagsAttr::get(
        reductionOp.getContext(),
        convertArithFastMathFlagsToLLVM(fMFAttr.getValue()));
    fmf = LLVM::FastmathFlagsAttr::get(
        reductionOp.getContext(),
        fmf.getValue() | (reassociateFPReductions ? LLVM::FastmathFlags::reassoc
                                                  : LLVM::FastmathFlags::none));

    // Floating-point reductions: add/mul/min/max
    // add/mul intrinsics take an explicit start value, filled with the
    // reduction's neutral element when no accumulator is present.
    Value result;
    if (kind == vector::CombiningKind::ADD) {
      result = lowerReductionWithStartValue<LLVM::vector_reduce_fadd,
                                            ReductionNeutralZero>(
          rewriter, loc, llvmType, operand, acc, fmf);
    } else if (kind == vector::CombiningKind::MUL) {
      result = lowerReductionWithStartValue<LLVM::vector_reduce_fmul,
                                            ReductionNeutralFPOne>(
          rewriter, loc, llvmType, operand, acc, fmf);
    } else if (kind == vector::CombiningKind::MINIMUMF) {
      result =
          createFPReductionComparisonOpLowering<LLVM::vector_reduce_fminimum>(
              rewriter, loc, llvmType, operand, acc, fmf);
    } else if (kind == vector::CombiningKind::MAXIMUMF) {
      result =
          createFPReductionComparisonOpLowering<LLVM::vector_reduce_fmaximum>(
              rewriter, loc, llvmType, operand, acc, fmf);
    } else if (kind == vector::CombiningKind::MINNUMF) {
      result = createFPReductionComparisonOpLowering<LLVM::vector_reduce_fmin>(
          rewriter, loc, llvmType, operand, acc, fmf);
    } else if (kind == vector::CombiningKind::MAXNUMF) {
      result = createFPReductionComparisonOpLowering<LLVM::vector_reduce_fmax>(
          rewriter, loc, llvmType, operand, acc, fmf);
    } else {
      // Integer-only combining kinds are invalid with a float element type.
      return failure();
    }

    rewriter.replaceOp(reductionOp, result);
    return success();
  }
893
894private:
895 const bool reassociateFPReductions;
896};
897
898/// Base class to convert a `vector.mask` operation while matching traits
899/// of the maskable operation nested inside. A `VectorMaskOpConversionBase`
900/// instance matches against a `vector.mask` operation. The `matchAndRewrite`
901/// method performs a second match against the maskable operation `MaskedOp`.
902/// Finally, it invokes the virtual method `matchAndRewriteMaskableOp` to be
903/// implemented by the concrete conversion classes. This method can match
904/// against specific traits of the `vector.mask` and the maskable operation. It
905/// must replace the `vector.mask` operation.
906template <class MaskedOp>
907class VectorMaskOpConversionBase
908 : public ConvertOpToLLVMPattern<vector::MaskOp> {
909public:
910 using ConvertOpToLLVMPattern<vector::MaskOp>::ConvertOpToLLVMPattern;
911
912 LogicalResult
913 matchAndRewrite(vector::MaskOp maskOp, OpAdaptor adaptor,
914 ConversionPatternRewriter &rewriter) const final {
915 // Match against the maskable operation kind.
916 auto maskedOp = llvm::dyn_cast_or_null<MaskedOp>(maskOp.getMaskableOp());
917 if (!maskedOp)
918 return failure();
919 return matchAndRewriteMaskableOp(maskOp, maskedOp, rewriter);
920 }
921
922protected:
923 virtual LogicalResult
924 matchAndRewriteMaskableOp(vector::MaskOp maskOp,
925 vector::MaskableOpInterface maskableOp,
926 ConversionPatternRewriter &rewriter) const = 0;
927};
928
/// Converts a masked `vector.reduction` (i.e. one nested under `vector.mask`)
/// to an LLVM vector-predication (`vp.reduce.*`) intrinsic when one exists.
/// `maximumf`/`minimumf` have no VP intrinsic and are instead lowered through
/// the regular reduce intrinsic after substituting a mask-neutral value into
/// the inactive lanes.
class MaskedReductionOpConversion
    : public VectorMaskOpConversionBase<vector::ReductionOp> {

public:
  using VectorMaskOpConversionBase<
      vector::ReductionOp>::VectorMaskOpConversionBase;

  LogicalResult matchAndRewriteMaskableOp(
      vector::MaskOp maskOp, MaskableOpInterface maskableOp,
      ConversionPatternRewriter &rewriter) const override {
    auto reductionOp = cast<ReductionOp>(maskableOp.getOperation());
    auto kind = reductionOp.getKind();
    Type eltType = reductionOp.getDest().getType();
    Type llvmType = typeConverter->convertType(eltType);
    // NOTE(review): operands are read off the reduction op itself rather than
    // an adaptor here — presumably already converted by the enclosing mask
    // conversion; verify against the driver.
    Value operand = reductionOp.getVector();
    Value acc = reductionOp.getAcc();
    Location loc = reductionOp.getLoc();

    // Fast-math flags are consumed only by the maximumf/minimumf cases below;
    // the VP-intrinsic paths do not take them.
    arith::FastMathFlagsAttr fMFAttr = reductionOp.getFastMathFlagsAttr();
    LLVM::FastmathFlagsAttr fmf = LLVM::FastmathFlagsAttr::get(
        reductionOp.getContext(),
        convertArithFastMathFlagsToLLVM(fMFAttr.getValue()));

    // Each VP lowering is parameterized on the reduction's neutral element,
    // which serves as the start value of the predicated reduction.
    Value result;
    switch (kind) {
    case vector::CombiningKind::ADD:
      result = lowerPredicatedReductionWithStartValue<
          LLVM::VPReduceAddOp, ReductionNeutralZero, LLVM::VPReduceFAddOp,
          ReductionNeutralZero>(rewriter, loc, llvmType, operand, acc,
                                maskOp.getMask());
      break;
    case vector::CombiningKind::MUL:
      result = lowerPredicatedReductionWithStartValue<
          LLVM::VPReduceMulOp, ReductionNeutralIntOne, LLVM::VPReduceFMulOp,
          ReductionNeutralFPOne>(rewriter, loc, llvmType, operand, acc,
                                 maskOp.getMask());
      break;
    case vector::CombiningKind::MINUI:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceUMinOp,
                                                      ReductionNeutralUIntMax>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::MINSI:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceSMinOp,
                                                      ReductionNeutralSIntMax>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::MAXUI:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceUMaxOp,
                                                      ReductionNeutralUIntMin>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::MAXSI:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceSMaxOp,
                                                      ReductionNeutralSIntMin>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::AND:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceAndOp,
                                                      ReductionNeutralAllOnes>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::OR:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceOrOp,
                                                      ReductionNeutralZero>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::XOR:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceXorOp,
                                                      ReductionNeutralZero>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::MINNUMF:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceFMinOp,
                                                      ReductionNeutralFPMax>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    case vector::CombiningKind::MAXNUMF:
      result = lowerPredicatedReductionWithStartValue<LLVM::VPReduceFMaxOp,
                                                      ReductionNeutralFPMin>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask());
      break;
    // No VP intrinsic exists for maximumf/minimumf: fall back to the regular
    // intrinsic with mask-neutral values in the masked-off lanes.
    case CombiningKind::MAXIMUMF:
      result = lowerMaskedReductionWithRegular<LLVM::vector_reduce_fmaximum,
                                               MaskNeutralFMaximum>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask(), fmf);
      break;
    case CombiningKind::MINIMUMF:
      result = lowerMaskedReductionWithRegular<LLVM::vector_reduce_fminimum,
                                               MaskNeutralFMinimum>(
          rewriter, loc, llvmType, operand, acc, maskOp.getMask(), fmf);
      break;
    }
    // No default case above: the switch covers every CombiningKind, so
    // `result` is always assigned at this point.

    // Replace `vector.mask` operation altogether.
    rewriter.replaceOp(maskOp, result);
    return success();
  }
};
1028
1029class VectorShuffleOpConversion
1030 : public ConvertOpToLLVMPattern<vector::ShuffleOp> {
1031public:
1032 using ConvertOpToLLVMPattern<vector::ShuffleOp>::ConvertOpToLLVMPattern;
1033
1034 LogicalResult
1035 matchAndRewrite(vector::ShuffleOp shuffleOp, OpAdaptor adaptor,
1036 ConversionPatternRewriter &rewriter) const override {
1037 auto loc = shuffleOp->getLoc();
1038 auto v1Type = shuffleOp.getV1VectorType();
1039 auto v2Type = shuffleOp.getV2VectorType();
1040 auto vectorType = shuffleOp.getResultVectorType();
1041 Type llvmType = typeConverter->convertType(vectorType);
1042 ArrayRef<int64_t> mask = shuffleOp.getMask();
1043
1044 // Bail if result type cannot be lowered.
1045 if (!llvmType)
1046 return failure();
1047
1048 // Get rank and dimension sizes.
1049 int64_t rank = vectorType.getRank();
1050#ifndef NDEBUG
1051 bool wellFormed0DCase =
1052 v1Type.getRank() == 0 && v2Type.getRank() == 0 && rank == 1;
1053 bool wellFormedNDCase =
1054 v1Type.getRank() == rank && v2Type.getRank() == rank;
1055 assert((wellFormed0DCase || wellFormedNDCase) && "op is not well-formed");
1056#endif
1057
1058 // For rank 0 and 1, where both operands have *exactly* the same vector
1059 // type, there is direct shuffle support in LLVM. Use it!
1060 if (rank <= 1 && v1Type == v2Type) {
1061 Value llvmShuffleOp = LLVM::ShuffleVectorOp::create(
1062 rewriter, loc, adaptor.getV1(), adaptor.getV2(),
1063 llvm::to_vector_of<int32_t>(mask));
1064 rewriter.replaceOp(shuffleOp, llvmShuffleOp);
1065 return success();
1066 }
1067
1068 // For all other cases, insert the individual values individually.
1069 int64_t v1Dim = v1Type.getDimSize(0);
1070 Type eltType;
1071 if (auto arrayType = dyn_cast<LLVM::LLVMArrayType>(llvmType))
1072 eltType = arrayType.getElementType();
1073 else
1074 eltType = cast<VectorType>(llvmType).getElementType();
1075 Value insert = LLVM::PoisonOp::create(rewriter, loc, llvmType);
1076 int64_t insPos = 0;
1077 for (int64_t extPos : mask) {
1078 Value value = adaptor.getV1();
1079 if (extPos >= v1Dim) {
1080 extPos -= v1Dim;
1081 value = adaptor.getV2();
1082 }
1083 Value extract = extractOne(rewriter, *getTypeConverter(), loc, value,
1084 eltType, rank, extPos);
1085 insert = insertOne(rewriter, *getTypeConverter(), loc, insert, extract,
1086 llvmType, rank, insPos++);
1087 }
1088 rewriter.replaceOp(shuffleOp, insert);
1089 return success();
1090 }
1091};
1092
/// Converts `vector.extract` to `llvm.extractvalue` (for positions into the
/// outer, aggregate-modeled dimensions) and/or `llvm.extractelement` (for a
/// final scalar extraction out of a 1-D vector).
class VectorExtractOpConversion
    : public ConvertOpToLLVMPattern<vector::ExtractOp> {
public:
  using ConvertOpToLLVMPattern<vector::ExtractOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::ExtractOp extractOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = extractOp->getLoc();
    auto resultType = extractOp.getResult().getType();
    auto llvmResultType = typeConverter->convertType(resultType);
    // Bail if result type cannot be lowered.
    if (!llvmResultType)
      return failure();

    // Mixed static/dynamic extraction positions, as attributes or Values.
    SmallVector<OpFoldResult> positionVec = getMixedValues(
        adaptor.getStaticPosition(), adaptor.getDynamicPosition(), rewriter);

    // The Vector -> LLVM lowering models N-D vectors as nested aggregates of
    // 1-d vectors. This nesting is modeled using arrays. We do this conversion
    // from a N-d vector extract to a nested aggregate vector extract in two
    // steps:
    //  - Extract a member from the nested aggregate. The result can be
    //    a lower rank nested aggregate or a vector (1-D). This is done using
    //    `llvm.extractvalue`.
    //  - Extract a scalar out of the vector if needed. This is done using
    //    `llvm.extractelement`.

    // Determine if we need to extract a member out of the aggregate. We
    // always need to extract a member if the input rank >= 2.
    bool extractsAggregate = extractOp.getSourceVectorType().getRank() >= 2;
    // Determine if we need to extract a scalar as the result. We extract
    // a scalar if the extract is full rank, i.e., the number of indices is
    // equal to source vector rank.
    bool extractsScalar = static_cast<int64_t>(positionVec.size()) ==
                          extractOp.getSourceVectorType().getRank();

    // Since the LLVM type converter converts 0-d vectors to 1-d vectors, we
    // need to add a position for this change.
    if (extractOp.getSourceVectorType().getRank() == 0) {
      Type idxType = typeConverter->convertType(rewriter.getIndexType());
      positionVec.push_back(rewriter.getZeroAttr(idxType));
    }

    Value extracted = adaptor.getSource();
    if (extractsAggregate) {
      ArrayRef<OpFoldResult> position(positionVec);
      if (extractsScalar) {
        // If we are extracting a scalar from the extracted member, we drop
        // the last index, which will be used to extract the scalar out of the
        // vector.
        position = position.drop_back();
      }
      // llvm.extractvalue does not support dynamic dimensions.
      if (!llvm::all_of(position, llvm::IsaPred<Attribute>)) {
        return failure();
      }
      extracted = LLVM::ExtractValueOp::create(rewriter, loc, extracted,
                                               getAsIntegers(position));
    }

    if (extractsScalar) {
      // The last (possibly dynamic) position indexes into the 1-D vector.
      extracted = LLVM::ExtractElementOp::create(
          rewriter, loc, extracted,
          getAsLLVMValue(rewriter, loc, positionVec.back()));
    }

    rewriter.replaceOp(extractOp, extracted);
    return success();
  }
};
1164
1165/// Conversion pattern that turns a vector.fma on a 1-D vector
1166/// into an llvm.intr.fmuladd. This is a trivial 1-1 conversion.
1167/// This does not match vectors of n >= 2 rank.
1168///
1169/// Example:
1170/// ```
1171/// vector.fma %a, %a, %a : vector<8xf32>
1172/// ```
1173/// is converted to:
1174/// ```
1175/// llvm.intr.fmuladd %va, %va, %va:
1176/// (!llvm."<8 x f32>">, !llvm<"<8 x f32>">, !llvm<"<8 x f32>">)
1177/// -> !llvm."<8 x f32>">
1178/// ```
1179class VectorFMAOp1DConversion : public ConvertOpToLLVMPattern<vector::FMAOp> {
1180public:
1181 using ConvertOpToLLVMPattern<vector::FMAOp>::ConvertOpToLLVMPattern;
1182
1183 LogicalResult
1184 matchAndRewrite(vector::FMAOp fmaOp, OpAdaptor adaptor,
1185 ConversionPatternRewriter &rewriter) const override {
1186 VectorType vType = fmaOp.getVectorType();
1187 if (vType.getRank() > 1)
1188 return failure();
1189
1190 rewriter.replaceOpWithNewOp<LLVM::FMulAddOp>(
1191 fmaOp, adaptor.getLhs(), adaptor.getRhs(), adaptor.getAcc());
1192 return success();
1193 }
1194};
1195
/// Converts `vector.insert`, mirroring `VectorExtractOpConversion`: positions
/// into the outer (aggregate-modeled) dimensions become
/// `llvm.extractvalue`/`llvm.insertvalue` indices, while an innermost-dim
/// position becomes an `llvm.insertelement` into a 1-D vector.
class VectorInsertOpConversion
    : public ConvertOpToLLVMPattern<vector::InsertOp> {
public:
  using ConvertOpToLLVMPattern<vector::InsertOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::InsertOp insertOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = insertOp->getLoc();
    auto destVectorType = insertOp.getDestVectorType();
    auto llvmResultType = typeConverter->convertType(destVectorType);
    // Bail if result type cannot be lowered.
    if (!llvmResultType)
      return failure();

    // Mixed static/dynamic insertion positions, as attributes or Values.
    SmallVector<OpFoldResult> positionVec = getMixedValues(
        adaptor.getStaticPosition(), adaptor.getDynamicPosition(), rewriter);

    // The logic in this pattern mirrors VectorExtractOpConversion. Refer to
    // its explanatory comment about how N-D vectors are converted as nested
    // aggregates (llvm.array's) of 1D vectors.
    //
    // The innermost dimension of the destination vector, when converted to a
    // nested aggregate form, will always be a 1D vector.
    //
    // * If the insertion is happening into the innermost dimension of the
    //   destination vector:
    //   - If the destination is a nested aggregate, extract a 1D vector out of
    //     the aggregate. This can be done using llvm.extractvalue. The
    //     destination is now guaranteed to be a 1D vector, to which we are
    //     inserting.
    //   - Do the insertion into the 1D destination vector, and make the result
    //     the new source nested aggregate. This can be done using
    //     llvm.insertelement.
    // * Insert the source nested aggregate into the destination nested
    //   aggregate.

    // Determine if we need to extract/insert a 1D vector out of the aggregate.
    bool isNestedAggregate = isa<LLVM::LLVMArrayType>(llvmResultType);
    // Determine if we need to insert a scalar into the 1D vector.
    bool insertIntoInnermostDim =
        static_cast<int64_t>(positionVec.size()) == destVectorType.getRank();

    // All positions except (when inserting a scalar) the last one index the
    // 1-D vector within the aggregate.
    ArrayRef<OpFoldResult> positionOf1DVectorWithinAggregate(
        positionVec.begin(),
        insertIntoInnermostDim ? positionVec.size() - 1 : positionVec.size());
    OpFoldResult positionOfScalarWithin1DVector;
    if (destVectorType.getRank() == 0) {
      // Since the LLVM type converter converts 0D vectors to 1D vectors, we
      // need to create a 0 here as the position into the 1D vector.
      Type idxType = typeConverter->convertType(rewriter.getIndexType());
      positionOfScalarWithin1DVector = rewriter.getZeroAttr(idxType);
    } else if (insertIntoInnermostDim) {
      positionOfScalarWithin1DVector = positionVec.back();
    }

    // We are going to mutate this 1D vector until it is either the final
    // result (in the non-aggregate case) or the value that needs to be
    // inserted into the aggregate result.
    Value sourceAggregate = adaptor.getValueToStore();
    if (insertIntoInnermostDim) {
      // Scalar-into-1D-vector case, so we know we will have to create a
      // InsertElementOp. The question is into what destination.
      if (isNestedAggregate) {
        // Aggregate case: the destination for the InsertElementOp needs to be
        // extracted from the aggregate.
        if (!llvm::all_of(positionOf1DVectorWithinAggregate,
                          llvm::IsaPred<Attribute>)) {
          // llvm.extractvalue does not support dynamic dimensions.
          return failure();
        }
        sourceAggregate = LLVM::ExtractValueOp::create(
            rewriter, loc, adaptor.getDest(),
            getAsIntegers(positionOf1DVectorWithinAggregate));
      } else {
        // No-aggregate case. The destination for the InsertElementOp is just
        // the insertOp's destination.
        sourceAggregate = adaptor.getDest();
      }
      // Insert the scalar into the 1D vector.
      sourceAggregate = LLVM::InsertElementOp::create(
          rewriter, loc, sourceAggregate.getType(), sourceAggregate,
          adaptor.getValueToStore(),
          getAsLLVMValue(rewriter, loc, positionOfScalarWithin1DVector));
    }

    Value result = sourceAggregate;
    if (isNestedAggregate) {
      if (!llvm::all_of(positionOf1DVectorWithinAggregate,
                        llvm::IsaPred<Attribute>)) {
        // llvm.insertvalue does not support dynamic dimensions.
        return failure();
      }
      result = LLVM::InsertValueOp::create(
          rewriter, loc, adaptor.getDest(), sourceAggregate,
          getAsIntegers(positionOf1DVectorWithinAggregate));
    }

    rewriter.replaceOp(insertOp, result);
    return success();
  }
};
1298
1299/// Lower vector.scalable.insert ops to LLVM vector.insert
1300struct VectorScalableInsertOpLowering
1301 : public ConvertOpToLLVMPattern<vector::ScalableInsertOp> {
1302 using ConvertOpToLLVMPattern<
1303 vector::ScalableInsertOp>::ConvertOpToLLVMPattern;
1304
1305 LogicalResult
1306 matchAndRewrite(vector::ScalableInsertOp insOp, OpAdaptor adaptor,
1307 ConversionPatternRewriter &rewriter) const override {
1308 rewriter.replaceOpWithNewOp<LLVM::vector_insert>(
1309 insOp, adaptor.getDest(), adaptor.getValueToStore(), adaptor.getPos());
1310 return success();
1311 }
1312};
1313
1314/// Lower vector.scalable.extract ops to LLVM vector.extract
1315struct VectorScalableExtractOpLowering
1316 : public ConvertOpToLLVMPattern<vector::ScalableExtractOp> {
1317 using ConvertOpToLLVMPattern<
1318 vector::ScalableExtractOp>::ConvertOpToLLVMPattern;
1319
1320 LogicalResult
1321 matchAndRewrite(vector::ScalableExtractOp extOp, OpAdaptor adaptor,
1322 ConversionPatternRewriter &rewriter) const override {
1323 rewriter.replaceOpWithNewOp<LLVM::vector_extract>(
1324 extOp, typeConverter->convertType(extOp.getResultVectorType()),
1325 adaptor.getSource(), adaptor.getPos());
1326 return success();
1327 }
1328};
1329
1330/// Rank reducing rewrite for n-D FMA into (n-1)-D FMA where n > 1.
1331///
1332/// Example:
1333/// ```
1334/// %d = vector.fma %a, %b, %c : vector<2x4xf32>
1335/// ```
1336/// is rewritten into:
1337/// ```
1338/// %r = vector.broadcast %f0 : f32 to vector<2x4xf32>
1339/// %va = vector.extractvalue %a[0] : vector<2x4xf32>
1340/// %vb = vector.extractvalue %b[0] : vector<2x4xf32>
1341/// %vc = vector.extractvalue %c[0] : vector<2x4xf32>
1342/// %vd = vector.fma %va, %vb, %vc : vector<4xf32>
1343/// %r2 = vector.insertvalue %vd, %r[0] : vector<4xf32> into vector<2x4xf32>
1344/// %va2 = vector.extractvalue %a2[1] : vector<2x4xf32>
1345/// %vb2 = vector.extractvalue %b2[1] : vector<2x4xf32>
1346/// %vc2 = vector.extractvalue %c2[1] : vector<2x4xf32>
1347/// %vd2 = vector.fma %va2, %vb2, %vc2 : vector<4xf32>
1348/// %r3 = vector.insertvalue %vd2, %r2[1] : vector<4xf32> into vector<2x4xf32>
1349/// // %r3 holds the final value.
1350/// ```
1351class VectorFMAOpNDRewritePattern : public OpRewritePattern<FMAOp> {
1352public:
1353 using Base::Base;
1354
1355 void initialize() {
1356 // This pattern recursively unpacks one dimension at a time. The recursion
1357 // bounded as the rank is strictly decreasing.
1358 setHasBoundedRewriteRecursion();
1359 }
1360
1361 LogicalResult matchAndRewrite(FMAOp op,
1362 PatternRewriter &rewriter) const override {
1363 auto vType = op.getVectorType();
1364 if (vType.getRank() < 2)
1365 return failure();
1366
1367 auto loc = op.getLoc();
1368 auto elemType = vType.getElementType();
1369 Value zero = arith::ConstantOp::create(rewriter, loc, elemType,
1370 rewriter.getZeroAttr(elemType));
1371 Value desc = vector::BroadcastOp::create(rewriter, loc, vType, zero);
1372 for (int64_t i = 0, e = vType.getShape().front(); i != e; ++i) {
1373 Value extrLHS = ExtractOp::create(rewriter, loc, op.getLhs(), i);
1374 Value extrRHS = ExtractOp::create(rewriter, loc, op.getRhs(), i);
1375 Value extrACC = ExtractOp::create(rewriter, loc, op.getAcc(), i);
1376 Value fma = FMAOp::create(rewriter, loc, extrLHS, extrRHS, extrACC);
1377 desc = InsertOp::create(rewriter, loc, fma, desc, i);
1378 }
1379 rewriter.replaceOp(op, desc);
1380 return success();
1381 }
1382};
1383
1384/// Returns the strides if the memory underlying `memRefType` has a contiguous
1385/// static layout.
1386static std::optional<SmallVector<int64_t, 4>>
1387computeContiguousStrides(MemRefType memRefType) {
1388 int64_t offset;
1390 if (failed(memRefType.getStridesAndOffset(strides, offset)))
1391 return std::nullopt;
1392 if (!strides.empty() && strides.back() != 1)
1393 return std::nullopt;
1394 // If no layout or identity layout, this is contiguous by definition.
1395 if (memRefType.getLayout().isIdentity())
1396 return strides;
1397
1398 // Otherwise, we must determine contiguity form shapes. This can only ever
1399 // work in static cases because MemRefType is underspecified to represent
1400 // contiguous dynamic shapes in other ways than with just empty/identity
1401 // layout.
1402 auto sizes = memRefType.getShape();
1403 for (int index = 0, e = strides.size() - 1; index < e; ++index) {
1404 if (ShapedType::isDynamic(sizes[index + 1]) ||
1405 ShapedType::isDynamic(strides[index]) ||
1406 ShapedType::isDynamic(strides[index + 1]))
1407 return std::nullopt;
1408 if (strides[index] != strides[index + 1] * sizes[index + 1])
1409 return std::nullopt;
1410 }
1411 return strides;
1412}
1413
/// Converts `vector.type_cast` between statically-shaped, contiguous memrefs
/// by building a fresh target memref descriptor that reuses the source's
/// allocated/aligned pointers and re-derives offset, sizes, and strides from
/// the target type.
class VectorTypeCastOpConversion
    : public ConvertOpToLLVMPattern<vector::TypeCastOp> {
public:
  using ConvertOpToLLVMPattern<vector::TypeCastOp>::ConvertOpToLLVMPattern;

  LogicalResult
  matchAndRewrite(vector::TypeCastOp castOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    auto loc = castOp->getLoc();
    MemRefType sourceMemRefType =
        cast<MemRefType>(castOp.getOperand().getType());
    MemRefType targetMemRefType = castOp.getType();

    // Only static shape casts supported atm.
    if (!sourceMemRefType.hasStaticShape() ||
        !targetMemRefType.hasStaticShape())
      return failure();

    // The converted source operand must already be a memref descriptor
    // (an LLVM struct).
    auto llvmSourceDescriptorTy =
        dyn_cast<LLVM::LLVMStructType>(adaptor.getOperands()[0].getType());
    if (!llvmSourceDescriptorTy)
      return failure();
    MemRefDescriptor sourceMemRef(adaptor.getOperands()[0]);

    auto llvmTargetDescriptorTy = dyn_cast_or_null<LLVM::LLVMStructType>(
        typeConverter->convertType(targetMemRefType));
    if (!llvmTargetDescriptorTy)
      return failure();

    // Only contiguous source buffers supported atm.
    auto sourceStrides = computeContiguousStrides(sourceMemRefType);
    if (!sourceStrides)
      return failure();
    auto targetStrides = computeContiguousStrides(targetMemRefType);
    if (!targetStrides)
      return failure();
    // Only support static strides for now, regardless of contiguity.
    if (llvm::any_of(*targetStrides, ShapedType::isDynamic))
      return failure();

    auto int64Ty = IntegerType::get(rewriter.getContext(), 64);

    // Create descriptor.
    auto desc = MemRefDescriptor::poison(rewriter, loc, llvmTargetDescriptorTy);
    // Set allocated ptr.
    Value allocated = sourceMemRef.allocatedPtr(rewriter, loc);
    desc.setAllocatedPtr(rewriter, loc, allocated);

    // Set aligned ptr.
    Value ptr = sourceMemRef.alignedPtr(rewriter, loc);
    desc.setAlignedPtr(rewriter, loc, ptr);
    // Fill offset 0.
    auto attr = rewriter.getIntegerAttr(rewriter.getIndexType(), 0);
    auto zero = LLVM::ConstantOp::create(rewriter, loc, int64Ty, attr);
    desc.setOffset(rewriter, loc, zero);

    // Fill size and stride descriptors in memref.
    // Sizes/strides come from the *target* type; they are static, so they
    // materialize as i64 constants.
    for (const auto &indexedSize :
         llvm::enumerate(targetMemRefType.getShape())) {
      int64_t index = indexedSize.index();
      auto sizeAttr =
          rewriter.getIntegerAttr(rewriter.getIndexType(), indexedSize.value());
      auto size = LLVM::ConstantOp::create(rewriter, loc, int64Ty, sizeAttr);
      desc.setSize(rewriter, loc, index, size);
      auto strideAttr = rewriter.getIntegerAttr(rewriter.getIndexType(),
                                                (*targetStrides)[index]);
      auto stride =
          LLVM::ConstantOp::create(rewriter, loc, int64Ty, strideAttr);
      desc.setStride(rewriter, loc, index, stride);
    }

    rewriter.replaceOp(castOp, {desc});
    return success();
  }
};
1489
1490/// Conversion pattern for a `vector.create_mask` (1-D scalable vectors only).
1491/// Non-scalable versions of this operation are handled in Vector Transforms.
1492class VectorCreateMaskOpConversion
1493 : public OpConversionPattern<vector::CreateMaskOp> {
1494public:
1495 explicit VectorCreateMaskOpConversion(MLIRContext *context,
1496 bool enableIndexOpt)
1497 : OpConversionPattern<vector::CreateMaskOp>(context),
1498 force32BitVectorIndices(enableIndexOpt) {}
1499
1500 LogicalResult
1501 matchAndRewrite(vector::CreateMaskOp op, OpAdaptor adaptor,
1502 ConversionPatternRewriter &rewriter) const override {
1503 auto dstType = op.getType();
1504 if (dstType.getRank() != 1 || !cast<VectorType>(dstType).isScalable())
1505 return failure();
1506 IntegerType idxType =
1507 force32BitVectorIndices ? rewriter.getI32Type() : rewriter.getI64Type();
1508 auto loc = op->getLoc();
1509 Value indices = LLVM::StepVectorOp::create(
1510 rewriter, loc,
1511 LLVM::getVectorType(idxType, dstType.getShape()[0],
1512 /*isScalable=*/true));
1513 auto bound = getValueOrCreateCastToIndexLike(rewriter, loc, idxType,
1514 adaptor.getOperands()[0]);
1515 Value bounds = BroadcastOp::create(rewriter, loc, indices.getType(), bound);
1516 Value comp = arith::CmpIOp::create(rewriter, loc, arith::CmpIPredicate::slt,
1517 indices, bounds);
1518 rewriter.replaceOp(op, comp);
1519 return success();
1520 }
1521
1522private:
1523 const bool force32BitVectorIndices;
1524};
1525
1526class VectorPrintOpConversion : public ConvertOpToLLVMPattern<vector::PrintOp> {
1527 SymbolTableCollection *symbolTables = nullptr;
1528
1529public:
  /// Creates the pattern. `symbolTables`, when non-null, is forwarded to the
  /// `LLVM::lookupOrCreate*Fn` helpers used to declare the runtime print
  /// functions.
  explicit VectorPrintOpConversion(
      const LLVMTypeConverter &typeConverter,
      SymbolTableCollection *symbolTables = nullptr)
      : ConvertOpToLLVMPattern<vector::PrintOp>(typeConverter),
        symbolTables(symbolTables) {}
1535
1536 // Lowering implementation that relies on a small runtime support library,
1537 // which only needs to provide a few printing methods (single value for all
1538 // data types, opening/closing bracket, comma, newline). The lowering splits
1539 // the vector into elementary printing operations. The advantage of this
1540 // approach is that the library can remain unaware of all low-level
1541 // implementation details of vectors while still supporting output of any
1542 // shaped and dimensioned vector.
1543 //
1544 // Note: This lowering only handles scalars, n-D vectors are broken into
1545 // printing scalars in loops in VectorToSCF.
1546 //
1547 // TODO: rely solely on libc in future? something else?
1548 //
  LogicalResult
  matchAndRewrite(vector::PrintOp printOp, OpAdaptor adaptor,
                  ConversionPatternRewriter &rewriter) const override {
    // The runtime print functions are declared at module scope.
    auto parent = printOp->getParentOfType<ModuleOp>();
    if (!parent)
      return failure();

    auto loc = printOp->getLoc();

    // First print the scalar source value, if present.
    if (auto value = adaptor.getSource()) {
      Type printType = printOp.getPrintType();
      if (isa<VectorType>(printType)) {
        // Vectors should be broken into elementary print ops in VectorToSCF.
        return failure();
      }
      if (failed(emitScalarPrint(rewriter, parent, loc, printType, value)))
        return failure();
    }

    // Then emit the trailing string literal or punctuation, if any; a string
    // literal takes precedence over punctuation.
    auto punct = printOp.getPunctuation();
    if (auto stringLiteral = printOp.getStringLiteral()) {
      auto createResult =
          LLVM::createPrintStrCall(rewriter, loc, parent, "vector_print_str",
                                   *stringLiteral, *getTypeConverter(),
                                   /*addNewline=*/false);
      if (createResult.failed())
        return failure();

    } else if (punct != PrintPunctuation::NoPunctuation) {
      // Look up (or declare) the runtime function for this punctuation kind.
      FailureOr<LLVM::LLVMFuncOp> op = [&]() {
        switch (punct) {
        case PrintPunctuation::Close:
          return LLVM::lookupOrCreatePrintCloseFn(rewriter, parent,
                                                  symbolTables);
        case PrintPunctuation::Open:
          return LLVM::lookupOrCreatePrintOpenFn(rewriter, parent,
                                                 symbolTables);
        case PrintPunctuation::Comma:
          return LLVM::lookupOrCreatePrintCommaFn(rewriter, parent,
                                                  symbolTables);
        case PrintPunctuation::NewLine:
          return LLVM::lookupOrCreatePrintNewlineFn(rewriter, parent,
                                                    symbolTables);
        default:
          llvm_unreachable("unexpected punctuation");
        }
      }();
      if (failed(op))
        return failure();
      emitCall(rewriter, printOp->getLoc(), op.value());
    }

    // vector.print produces no results; erase it once lowered.
    rewriter.eraseOp(printOp);
    return success();
  }
1604
1605private:
  /// Adaptation applied to a scalar value before passing it to its runtime
  /// print function (see emitScalarPrint).
  enum class PrintConversion {
    // clang-format off
    None,       // Pass the value through unchanged.
    ZeroExt64,  // Zero-extend to i64 (unsigned ints, and i1 so true prints as 1).
    SignExt64,  // Sign-extend to i64 (signed/signless ints narrower than 64 bits).
    Bitcast16   // Reinterpret f16/bf16 as their raw 16 bits.
    // clang-format on
  };
1614
  /// Lowers the printing of one scalar `value` of type `printType` to a call
  /// into the runtime print library. Selects the runtime function and any
  /// required operand pre-conversion based on the element type. Returns
  /// failure when the type is unsupported or cannot be converted.
  LogicalResult emitScalarPrint(ConversionPatternRewriter &rewriter,
                                ModuleOp parent, Location loc, Type printType,
                                Value value) const {
    // Bail out early when the type converter cannot handle the element type.
    if (typeConverter->convertType(printType) == nullptr)
      return failure();

    // Make sure element type has runtime support.
    PrintConversion conversion = PrintConversion::None;
    FailureOr<Operation *> printer;
    if (printType.isF32()) {
      printer = LLVM::lookupOrCreatePrintF32Fn(rewriter, parent, symbolTables);
    } else if (printType.isF64()) {
      printer = LLVM::lookupOrCreatePrintF64Fn(rewriter, parent, symbolTables);
    } else if (printType.isF16()) {
      conversion = PrintConversion::Bitcast16; // bits!
      printer = LLVM::lookupOrCreatePrintF16Fn(rewriter, parent, symbolTables);
    } else if (printType.isBF16()) {
      conversion = PrintConversion::Bitcast16; // bits!
      printer = LLVM::lookupOrCreatePrintBF16Fn(rewriter, parent, symbolTables);
    } else if (printType.isIndex()) {
      // Index values are printed as unsigned 64-bit integers.
      printer = LLVM::lookupOrCreatePrintU64Fn(rewriter, parent, symbolTables);
    } else if (auto intTy = dyn_cast<IntegerType>(printType)) {
      // Integers need a zero or sign extension on the operand
      // (depending on the source type) as well as a signed or
      // unsigned print method. Up to 64-bit is supported.
      unsigned width = intTy.getWidth();
      if (intTy.isUnsigned()) {
        if (width <= 64) {
          if (width < 64)
            conversion = PrintConversion::ZeroExt64;
          printer =
              LLVM::lookupOrCreatePrintU64Fn(rewriter, parent, symbolTables);
        } else {
          // Integers wider than 64 bits have no runtime support.
          return failure();
        }
      } else {
        assert(intTy.isSignless() || intTy.isSigned());
        if (width <= 64) {
          // Note that we *always* zero extend booleans (1-bit integers),
          // so that true/false is printed as 1/0 rather than -1/0.
          if (width == 1)
            conversion = PrintConversion::ZeroExt64;
          else if (width < 64)
            conversion = PrintConversion::SignExt64;
          printer =
              LLVM::lookupOrCreatePrintI64Fn(rewriter, parent, symbolTables);
        } else {
          return failure();
        }
      }
    } else if (auto floatTy = dyn_cast<FloatType>(printType)) {
      // Print other floating-point types using the APFloat runtime library:
      // the callee receives the float-semantics enum and the bits in an i64.
      int32_t sem =
          llvm::APFloatBase::SemanticsToEnum(floatTy.getFloatSemantics());
      Value semValue = LLVM::ConstantOp::create(
          rewriter, loc, rewriter.getI32Type(),
          rewriter.getIntegerAttr(rewriter.getI32Type(), sem));
      // NOTE(review): `value` is zero-extended to i64 here, which presumes it
      // already carries an integer bit-pattern when this branch is reached —
      // confirm with the callers of emitScalarPrint.
      Value floatBits =
          LLVM::ZExtOp::create(rewriter, loc, rewriter.getI64Type(), value);
      printer =
          LLVM::lookupOrCreateApFloatPrintFn(rewriter, parent, symbolTables);
      // NOTE(review): unlike the other branches, `printer` is used without a
      // failed() check here — confirm lookupOrCreateApFloatPrintFn cannot
      // fail in this context.
      emitCall(rewriter, loc, printer.value(),
               ValueRange({semValue, floatBits}));
      return success();
    } else {
      return failure();
    }
    if (failed(printer))
      return failure();

    // Apply the operand pre-conversion selected above, then call the printer.
    switch (conversion) {
    case PrintConversion::ZeroExt64:
      value = arith::ExtUIOp::create(
          rewriter, loc, IntegerType::get(rewriter.getContext(), 64), value);
      break;
    case PrintConversion::SignExt64:
      value = arith::ExtSIOp::create(
          rewriter, loc, IntegerType::get(rewriter.getContext(), 64), value);
      break;
    case PrintConversion::Bitcast16:
      // Reinterpret f16/bf16 as its 16-bit integer bit pattern.
      value = LLVM::BitcastOp::create(
          rewriter, loc, IntegerType::get(rewriter.getContext(), 16), value);
      break;
    case PrintConversion::None:
      break;
    }
    emitCall(rewriter, loc, printer.value(), value);
    return success();
  }
1704
1705 // Helper to emit a call.
1706 static void emitCall(ConversionPatternRewriter &rewriter, Location loc,
1707 Operation *ref, ValueRange params = ValueRange()) {
1708 LLVM::CallOp::create(rewriter, loc, TypeRange(), SymbolRefAttr::get(ref),
1709 params);
1710 }
1711};
1712
1713/// A broadcast of a scalar is lowered to an insertelement + a shufflevector
1714/// operation. Only broadcasts to 0-d and 1-d vectors are lowered by this
1715/// pattern, the higher rank cases are handled by another pattern.
1716struct VectorBroadcastScalarToLowRankLowering
1717 : public ConvertOpToLLVMPattern<vector::BroadcastOp> {
1718 using ConvertOpToLLVMPattern<vector::BroadcastOp>::ConvertOpToLLVMPattern;
1719
1720 LogicalResult
1721 matchAndRewrite(vector::BroadcastOp broadcast, OpAdaptor adaptor,
1722 ConversionPatternRewriter &rewriter) const override {
1723 if (isa<VectorType>(broadcast.getSourceType()))
1724 return rewriter.notifyMatchFailure(
1725 broadcast, "broadcast from vector type not handled");
1726
1727 VectorType resultType = broadcast.getType();
1728 if (resultType.getRank() > 1)
1729 return rewriter.notifyMatchFailure(broadcast,
1730 "broadcast to 2+-d handled elsewhere");
1731
1732 // First insert it into a poison vector so we can shuffle it.
1733 auto vectorType = typeConverter->convertType(broadcast.getType());
1734 Value poison =
1735 LLVM::PoisonOp::create(rewriter, broadcast.getLoc(), vectorType);
1736 auto zero = LLVM::ConstantOp::create(
1737 rewriter, broadcast.getLoc(),
1738 typeConverter->convertType(rewriter.getIntegerType(32)),
1739 rewriter.getZeroAttr(rewriter.getIntegerType(32)));
1740
1741 // For 0-d vector, we simply do `insertelement`.
1742 if (resultType.getRank() == 0) {
1743 rewriter.replaceOpWithNewOp<LLVM::InsertElementOp>(
1744 broadcast, vectorType, poison, adaptor.getSource(), zero);
1745 return success();
1746 }
1747
1748 auto v =
1749 LLVM::InsertElementOp::create(rewriter, broadcast.getLoc(), vectorType,
1750 poison, adaptor.getSource(), zero);
1751
1752 // For 1-d vector, we additionally do a `shufflevector`.
1753 int64_t width = cast<VectorType>(broadcast.getType()).getDimSize(0);
1754 SmallVector<int32_t> zeroValues(width, 0);
1755
1756 // Shuffle the value across the desired number of elements.
1757 auto shuffle = rewriter.createOrFold<LLVM::ShuffleVectorOp>(
1758 broadcast.getLoc(), v, poison, zeroValues);
1759 rewriter.replaceOp(broadcast, shuffle);
1760 return success();
1761 }
1762};
1763
1764/// The broadcast of a scalar is lowered to an insertelement + a shufflevector
1765/// operation. Only broadcasts to 2+-d vector result types are lowered by this
1766/// pattern, the 1-d case is handled by another pattern. Broadcasts from vectors
1767/// are not converted to LLVM, only broadcasts from scalars are.
1768struct VectorBroadcastScalarToNdLowering
1769 : public ConvertOpToLLVMPattern<BroadcastOp> {
1770 using ConvertOpToLLVMPattern<BroadcastOp>::ConvertOpToLLVMPattern;
1771
1772 LogicalResult
1773 matchAndRewrite(BroadcastOp broadcast, OpAdaptor adaptor,
1774 ConversionPatternRewriter &rewriter) const override {
1775 if (isa<VectorType>(broadcast.getSourceType()))
1776 return rewriter.notifyMatchFailure(
1777 broadcast, "broadcast from vector type not handled");
1778
1779 VectorType resultType = broadcast.getType();
1780 if (resultType.getRank() <= 1)
1781 return rewriter.notifyMatchFailure(
1782 broadcast, "broadcast to 1-d or 0-d handled elsewhere");
1783
1784 // First insert it into an undef vector so we can shuffle it.
1785 auto loc = broadcast.getLoc();
1786 auto vectorTypeInfo =
1787 LLVM::detail::extractNDVectorTypeInfo(resultType, *getTypeConverter());
1788 auto llvmNDVectorTy = vectorTypeInfo.llvmNDVectorTy;
1789 auto llvm1DVectorTy = vectorTypeInfo.llvm1DVectorTy;
1790 if (!llvmNDVectorTy || !llvm1DVectorTy)
1791 return failure();
1792
1793 // Construct returned value.
1794 Value desc = LLVM::PoisonOp::create(rewriter, loc, llvmNDVectorTy);
1795
1796 // Construct a 1-D vector with the broadcasted value that we insert in all
1797 // the places within the returned descriptor.
1798 Value vdesc = LLVM::PoisonOp::create(rewriter, loc, llvm1DVectorTy);
1799 auto zero = LLVM::ConstantOp::create(
1800 rewriter, loc, typeConverter->convertType(rewriter.getIntegerType(32)),
1801 rewriter.getZeroAttr(rewriter.getIntegerType(32)));
1802 Value v = LLVM::InsertElementOp::create(rewriter, loc, llvm1DVectorTy,
1803 vdesc, adaptor.getSource(), zero);
1804
1805 // Shuffle the value across the desired number of elements.
1806 int64_t width = resultType.getDimSize(resultType.getRank() - 1);
1807 SmallVector<int32_t> zeroValues(width, 0);
1808 v = LLVM::ShuffleVectorOp::create(rewriter, loc, v, v, zeroValues);
1809
1810 // Iterate of linear index, convert to coords space and insert broadcasted
1811 // 1-D vector in each position.
1812 nDVectorIterate(vectorTypeInfo, rewriter, [&](ArrayRef<int64_t> position) {
1813 desc = LLVM::InsertValueOp::create(rewriter, loc, desc, v, position);
1814 });
1815 rewriter.replaceOp(broadcast, desc);
1816 return success();
1817 }
1818};
1819
1820/// Conversion pattern for a `vector.interleave`.
1821/// This supports fixed-sized vectors and scalable vectors.
1822struct VectorInterleaveOpLowering
1823 : public ConvertOpToLLVMPattern<vector::InterleaveOp> {
1825
1826 LogicalResult
1827 matchAndRewrite(vector::InterleaveOp interleaveOp, OpAdaptor adaptor,
1828 ConversionPatternRewriter &rewriter) const override {
1829 VectorType resultType = interleaveOp.getResultVectorType();
1830 // n-D interleaves should have been lowered already.
1831 if (resultType.getRank() != 1)
1832 return rewriter.notifyMatchFailure(interleaveOp,
1833 "InterleaveOp not rank 1");
1834 // If the result is rank 1, then this directly maps to LLVM.
1835 if (resultType.isScalable()) {
1836 rewriter.replaceOpWithNewOp<LLVM::vector_interleave2>(
1837 interleaveOp, typeConverter->convertType(resultType),
1838 adaptor.getLhs(), adaptor.getRhs());
1839 return success();
1840 }
1841 // Lower fixed-size interleaves to a shufflevector. While the
1842 // vector.interleave2 intrinsic supports fixed and scalable vectors, the
1843 // langref still recommends fixed-vectors use shufflevector, see:
1844 // https://llvm.org/docs/LangRef.html#id876.
1845 int64_t resultVectorSize = resultType.getNumElements();
1846 SmallVector<int32_t> interleaveShuffleMask;
1847 interleaveShuffleMask.reserve(resultVectorSize);
1848 for (int i = 0, end = resultVectorSize / 2; i < end; ++i) {
1849 interleaveShuffleMask.push_back(i);
1850 interleaveShuffleMask.push_back((resultVectorSize / 2) + i);
1851 }
1852 rewriter.replaceOpWithNewOp<LLVM::ShuffleVectorOp>(
1853 interleaveOp, adaptor.getLhs(), adaptor.getRhs(),
1854 interleaveShuffleMask);
1855 return success();
1856 }
1857};
1858
1859/// Conversion pattern for a `vector.deinterleave`.
1860/// This supports fixed-sized vectors and scalable vectors.
1861struct VectorDeinterleaveOpLowering
1862 : public ConvertOpToLLVMPattern<vector::DeinterleaveOp> {
1864
1865 LogicalResult
1866 matchAndRewrite(vector::DeinterleaveOp deinterleaveOp, OpAdaptor adaptor,
1867 ConversionPatternRewriter &rewriter) const override {
1868 VectorType resultType = deinterleaveOp.getResultVectorType();
1869 VectorType sourceType = deinterleaveOp.getSourceVectorType();
1870 auto loc = deinterleaveOp.getLoc();
1871
1872 // Note: n-D deinterleave operations should be lowered to the 1-D before
1873 // converting to LLVM.
1874 if (resultType.getRank() != 1)
1875 return rewriter.notifyMatchFailure(deinterleaveOp,
1876 "DeinterleaveOp not rank 1");
1877
1878 if (resultType.isScalable()) {
1879 const auto *llvmTypeConverter = this->getTypeConverter();
1880 auto deinterleaveResults = deinterleaveOp.getResultTypes();
1881 auto packedOpResults =
1882 llvmTypeConverter->packOperationResults(deinterleaveResults);
1883 auto intrinsic = LLVM::vector_deinterleave2::create(
1884 rewriter, loc, packedOpResults, adaptor.getSource());
1885
1886 auto evenResult = LLVM::ExtractValueOp::create(
1887 rewriter, loc, intrinsic->getResult(0), 0);
1888 auto oddResult = LLVM::ExtractValueOp::create(rewriter, loc,
1889 intrinsic->getResult(0), 1);
1890
1891 rewriter.replaceOp(deinterleaveOp, ValueRange{evenResult, oddResult});
1892 return success();
1893 }
1894 // Lower fixed-size deinterleave to two shufflevectors. While the
1895 // vector.deinterleave2 intrinsic supports fixed and scalable vectors, the
1896 // langref still recommends fixed-vectors use shufflevector, see:
1897 // https://llvm.org/docs/LangRef.html#id889.
1898 int64_t resultVectorSize = resultType.getNumElements();
1899 SmallVector<int32_t> evenShuffleMask;
1900 SmallVector<int32_t> oddShuffleMask;
1901
1902 evenShuffleMask.reserve(resultVectorSize);
1903 oddShuffleMask.reserve(resultVectorSize);
1904
1905 for (int i = 0; i < sourceType.getNumElements(); ++i) {
1906 if (i % 2 == 0)
1907 evenShuffleMask.push_back(i);
1908 else
1909 oddShuffleMask.push_back(i);
1910 }
1911
1912 auto poison = LLVM::PoisonOp::create(rewriter, loc, sourceType);
1913 auto evenShuffle = LLVM::ShuffleVectorOp::create(
1914 rewriter, loc, adaptor.getSource(), poison, evenShuffleMask);
1915 auto oddShuffle = LLVM::ShuffleVectorOp::create(
1916 rewriter, loc, adaptor.getSource(), poison, oddShuffleMask);
1917
1918 rewriter.replaceOp(deinterleaveOp, ValueRange{evenShuffle, oddShuffle});
1919 return success();
1920 }
1921};
1922
1923/// Conversion pattern for a `vector.from_elements`.
1924struct VectorFromElementsLowering
1925 : public ConvertOpToLLVMPattern<vector::FromElementsOp> {
1927
1928 LogicalResult
1929 matchAndRewrite(vector::FromElementsOp fromElementsOp, OpAdaptor adaptor,
1930 ConversionPatternRewriter &rewriter) const override {
1931 Location loc = fromElementsOp.getLoc();
1932 VectorType vectorType = fromElementsOp.getType();
1933 // Only support 1-D vectors. Multi-dimensional vectors should have been
1934 // transformed to 1-D vectors by the vector-to-vector transformations before
1935 // this.
1936 if (vectorType.getRank() > 1)
1937 return rewriter.notifyMatchFailure(fromElementsOp,
1938 "rank > 1 vectors are not supported");
1939 Type llvmType = typeConverter->convertType(vectorType);
1940 Type llvmIndexType = typeConverter->convertType(rewriter.getIndexType());
1941 Value result = LLVM::PoisonOp::create(rewriter, loc, llvmType);
1942 for (auto [idx, val] : llvm::enumerate(adaptor.getElements())) {
1943 auto constIdx =
1944 LLVM::ConstantOp::create(rewriter, loc, llvmIndexType, idx);
1945 result = LLVM::InsertElementOp::create(rewriter, loc, llvmType, result,
1946 val, constIdx);
1947 }
1948 rewriter.replaceOp(fromElementsOp, result);
1949 return success();
1950 }
1951};
1952
1953/// Conversion pattern for a `vector.to_elements`.
1954struct VectorToElementsLowering
1955 : public ConvertOpToLLVMPattern<vector::ToElementsOp> {
1957
1958 LogicalResult
1959 matchAndRewrite(vector::ToElementsOp toElementsOp, OpAdaptor adaptor,
1960 ConversionPatternRewriter &rewriter) const override {
1961 Location loc = toElementsOp.getLoc();
1962 auto idxType = typeConverter->convertType(rewriter.getIndexType());
1963 Value source = adaptor.getSource();
1964
1965 SmallVector<Value> results(toElementsOp->getNumResults());
1966 for (auto [idx, element] : llvm::enumerate(toElementsOp.getElements())) {
1967 // Create an extractelement operation only for results that are not dead.
1968 if (element.use_empty())
1969 continue;
1970
1971 auto constIdx = LLVM::ConstantOp::create(
1972 rewriter, loc, idxType, rewriter.getIntegerAttr(idxType, idx));
1973 auto llvmType = typeConverter->convertType(element.getType());
1974
1975 Value result = LLVM::ExtractElementOp::create(rewriter, loc, llvmType,
1976 source, constIdx);
1977 results[idx] = result;
1978 }
1979
1980 rewriter.replaceOp(toElementsOp, results);
1981 return success();
1982 }
1983};
1984
1985/// Conversion pattern for vector.step.
1986struct VectorScalableStepOpLowering
1987 : public ConvertOpToLLVMPattern<vector::StepOp> {
1989
1990 LogicalResult
1991 matchAndRewrite(vector::StepOp stepOp, OpAdaptor adaptor,
1992 ConversionPatternRewriter &rewriter) const override {
1993 auto resultType = cast<VectorType>(stepOp.getType());
1994 if (!resultType.isScalable()) {
1995 return failure();
1996 }
1997 Type llvmType = typeConverter->convertType(stepOp.getType());
1998 rewriter.replaceOpWithNewOp<LLVM::StepVectorOp>(stepOp, llvmType);
1999 return success();
2000 }
2001};
2002
/// Progressive lowering of a `vector.contract %a, %b, %c` with row-major matmul
/// semantics to:
/// ```
/// %flattened_a = vector.shape_cast %a
/// %flattened_b = vector.shape_cast %b
/// %flattened_d = vector.matrix_multiply %flattened_a, %flattened_b
/// %d = vector.shape_cast %%flattened_d
/// %e = add %c, %d
/// ```
/// `vector.matrix_multiply` later lowers to `llvm.matrix.multiply`.
class ContractionOpToMatmulOpLowering
    : public vector::MaskableOpRewritePattern<vector::ContractionOp> {
public:
  using MaskableOpRewritePattern::MaskableOpRewritePattern;

  // High default benefit so this lowering is preferred over generic
  // contraction lowerings whenever it applies.
  ContractionOpToMatmulOpLowering(MLIRContext *context,
                                  PatternBenefit benefit = 100)
      : MaskableOpRewritePattern<vector::ContractionOp>(context, benefit) {}

  FailureOr<Value>
  matchAndRewriteMaskableOp(vector::ContractionOp op, MaskingOpInterface maskOp,
                            PatternRewriter &rewriter) const override;
};
2026
/// Lower a qualifying `vector.contract %a, %b, %c` (with row-major matmul
/// semantics directly into `llvm.intr.matrix.multiply`:
/// BEFORE:
/// ```mlir
/// %res = vector.contract #matmat_trait %lhs, %rhs, %acc
/// : vector<2x4xf32>, vector<4x3xf32> into vector<2x3xf32>
/// ```
///
/// AFTER:
/// ```mlir
/// %lhs = vector.shape_cast %arg0 : vector<2x4xf32> to vector<8xf32>
/// %rhs = vector.shape_cast %arg1 : vector<4x3xf32> to vector<12xf32>
/// %matmul = llvm.intr.matrix.multiply %lhs, %rhs
/// %res = arith.addf %acc, %matmul : vector<2x3xf32>
/// ```
//
/// Scalable vectors are not supported.
FailureOr<Value> ContractionOpToMatmulOpLowering::matchAndRewriteMaskableOp(
    vector::ContractionOp op, MaskingOpInterface maskOp,
    PatternRewriter &rew) const {
  // TODO: Support vector.mask.
  if (maskOp)
    return failure();

  // A matmul contraction has exactly (parallel, parallel, reduction)
  // iterator types.
  auto iteratorTypes = op.getIteratorTypes().getValue();
  if (!isParallelIterator(iteratorTypes[0]) ||
      !isParallelIterator(iteratorTypes[1]) ||
      !isReductionIterator(iteratorTypes[2]))
    return failure();

  Type opResType = op.getType();
  VectorType vecType = dyn_cast<VectorType>(opResType);
  if (vecType && vecType.isScalable()) {
    // Note - this is sufficient to reject all cases with scalable vectors.
    return failure();
  }

  Type elementType = op.getLhsType().getElementType();
  if (!elementType.isIntOrFloat())
    return failure();

  // Mixed-precision contractions are not handled; source and destination
  // element types must match.
  Type dstElementType = vecType ? vecType.getElementType() : opResType;
  if (elementType != dstElementType)
    return failure();

  // Perform lhs + rhs transpositions to conform to matmul row-major semantics.
  // Bail out if the contraction cannot be put in this form.
  MLIRContext *ctx = op.getContext();
  Location loc = op.getLoc();
  AffineExpr m, n, k;
  bindDims(rew.getContext(), m, n, k);
  // LHS must be A(m, k) or A(k, m).
  Value lhs = op.getLhs();
  auto lhsMap = op.getIndexingMapsArray()[0];
  if (lhsMap == AffineMap::get(3, 0, {k, m}, ctx))
    lhs = vector::TransposeOp::create(rew, loc, lhs, ArrayRef<int64_t>{1, 0});
  else if (lhsMap != AffineMap::get(3, 0, {m, k}, ctx))
    return failure();

  // RHS must be B(k, n) or B(n, k).
  Value rhs = op.getRhs();
  auto rhsMap = op.getIndexingMapsArray()[1];
  if (rhsMap == AffineMap::get(3, 0, {n, k}, ctx))
    rhs = vector::TransposeOp::create(rew, loc, rhs, ArrayRef<int64_t>{1, 0});
  else if (rhsMap != AffineMap::get(3, 0, {k, n}, ctx))
    return failure();

  // At this point lhs and rhs are in row-major.
  VectorType lhsType = cast<VectorType>(lhs.getType());
  VectorType rhsType = cast<VectorType>(rhs.getType());
  int64_t lhsRows = lhsType.getDimSize(0);
  int64_t lhsColumns = lhsType.getDimSize(1);
  int64_t rhsColumns = rhsType.getDimSize(1);

  // The matrix intrinsic works on flattened (1-D) operands.
  Type flattenedLHSType =
      VectorType::get(lhsType.getNumElements(), lhsType.getElementType());
  lhs = vector::ShapeCastOp::create(rew, loc, flattenedLHSType, lhs);

  Type flattenedRHSType =
      VectorType::get(rhsType.getNumElements(), rhsType.getElementType());
  rhs = vector::ShapeCastOp::create(rew, loc, flattenedRHSType, rhs);

  Value mul = LLVM::MatrixMultiplyOp::create(
      rew, loc,
      VectorType::get(lhsRows * rhsColumns,
                      cast<VectorType>(lhs.getType()).getElementType()),
      lhs, rhs, lhsRows, lhsColumns, rhsColumns);

  // Reshape the flat product back to the 2-D accumulator shape.
  mul = vector::ShapeCastOp::create(
      rew, loc,
      VectorType::get({lhsRows, rhsColumns},
                      getElementTypeOrSelf(op.getAcc().getType())),
      mul);

  // ACC must be C(m, n) or C(n, m).
  auto accMap = op.getIndexingMapsArray()[2];
  if (accMap == AffineMap::get(3, 0, {n, m}, ctx))
    mul = vector::TransposeOp::create(rew, loc, mul, ArrayRef<int64_t>{1, 0});
  else if (accMap != AffineMap::get(3, 0, {m, n}, ctx))
    llvm_unreachable("invalid contraction semantics");

  // Accumulate with the appropriate add for the element type.
  Value res = isa<IntegerType>(elementType)
                  ? static_cast<Value>(
                        arith::AddIOp::create(rew, loc, op.getAcc(), mul))
                  : static_cast<Value>(
                        arith::AddFOp::create(rew, loc, op.getAcc(), mul));

  return res;
}
2136
2137/// Lowers vector.transpose directly to llvm.intr.matrix.transpose
2138///
2139/// BEFORE:
2140/// ```mlir
2141/// %tr = vector.transpose %vec, [1, 0] : vector<2x4xf32> to vector<4x2xf32>
2142/// ```
2143/// AFTER:
2144/// ```mlir
2145/// %vec_cs = vector.shape_cast %vec : vector<2x4xf32> to vector<8xf32>
2146/// %tr = llvm.intr.matrix.transpose %vec_sc
2147/// {columns = 2 : i32, rows = 4 : i32} : vector<8xf32> into vector<8xf32>
2148/// %res = vector.shape_cast %tr : vector<8xf32> to vector<4x2xf32>
2149/// ```
2150class TransposeOpToMatrixTransposeOpLowering
2151 : public OpRewritePattern<vector::TransposeOp> {
2152public:
2153 using Base::Base;
2154
2155 LogicalResult matchAndRewrite(vector::TransposeOp op,
2156 PatternRewriter &rewriter) const override {
2157 auto loc = op.getLoc();
2158
2159 Value input = op.getVector();
2160 VectorType inputType = op.getSourceVectorType();
2161 VectorType resType = op.getResultVectorType();
2162
2163 if (inputType.isScalable())
2164 return rewriter.notifyMatchFailure(
2165 op, "This lowering does not support scalable vectors");
2166
2167 // Set up convenience transposition table.
2168 ArrayRef<int64_t> transp = op.getPermutation();
2169
2170 if (resType.getRank() != 2 || transp[0] != 1 || transp[1] != 0) {
2171 return failure();
2172 }
2173
2174 Type flattenedType =
2175 VectorType::get(resType.getNumElements(), resType.getElementType());
2176 auto matrix =
2177 vector::ShapeCastOp::create(rewriter, loc, flattenedType, input);
2178 auto rows = rewriter.getI32IntegerAttr(resType.getShape()[0]);
2179 auto columns = rewriter.getI32IntegerAttr(resType.getShape()[1]);
2180 Value trans = LLVM::MatrixTransposeOp::create(rewriter, loc, flattenedType,
2181 matrix, rows, columns);
2182 rewriter.replaceOpWithNewOp<vector::ShapeCastOp>(op, resType, trans);
2183 return success();
2184 }
2185};
2186
2187} // namespace
2188
2190 RewritePatternSet &patterns) {
2191 patterns.add<VectorFMAOpNDRewritePattern>(patterns.getContext());
2192}
2193
2195 RewritePatternSet &patterns, PatternBenefit benefit) {
2196 patterns.add<ContractionOpToMatmulOpLowering>(patterns.getContext(), benefit);
2197}
2198
2200 RewritePatternSet &patterns, PatternBenefit benefit) {
2201 patterns.add<TransposeOpToMatrixTransposeOpLowering>(patterns.getContext(),
2202 benefit);
2203}
2204
2205/// Populate the given list with patterns that convert from Vector to LLVM.
2207 const LLVMTypeConverter &converter, RewritePatternSet &patterns,
2208 bool reassociateFPReductions, bool force32BitVectorIndices,
2209 bool useVectorAlignment) {
2210 // This function populates only ConversionPatterns, not RewritePatterns.
2211 MLIRContext *ctx = converter.getDialect()->getContext();
2212 patterns.add<VectorReductionOpConversion>(converter, reassociateFPReductions);
2213 patterns.add<VectorCreateMaskOpConversion>(ctx, force32BitVectorIndices);
2214 patterns.add<VectorLoadStoreConversion<vector::LoadOp>,
2215 VectorLoadStoreConversion<vector::MaskedLoadOp>,
2216 VectorLoadStoreConversion<vector::StoreOp>,
2217 VectorLoadStoreConversion<vector::MaskedStoreOp>,
2218 VectorGatherOpConversion, VectorScatterOpConversion>(
2219 converter, useVectorAlignment);
2220 patterns.add<VectorBitCastOpConversion, VectorShuffleOpConversion,
2221 VectorExtractOpConversion, VectorFMAOp1DConversion,
2222 VectorInsertOpConversion, VectorPrintOpConversion,
2223 VectorTypeCastOpConversion, VectorScaleOpConversion,
2224 VectorExpandLoadOpConversion, VectorCompressStoreOpConversion,
2225 VectorBroadcastScalarToLowRankLowering,
2226 VectorBroadcastScalarToNdLowering,
2227 VectorScalableInsertOpLowering, VectorScalableExtractOpLowering,
2228 MaskedReductionOpConversion, VectorInterleaveOpLowering,
2229 VectorDeinterleaveOpLowering, VectorFromElementsLowering,
2230 VectorToElementsLowering, VectorScalableStepOpLowering>(
2231 converter);
2232}
2233
namespace {
/// ConvertToLLVM dialect-interface wiring for the Vector dialect: declares
/// the LLVM dialect dependency and registers the Vector-to-LLVM conversion
/// patterns when a generic convert-to-llvm pass runs.
struct VectorToLLVMDialectInterface : public ConvertToLLVMPatternInterface {
  VectorToLLVMDialectInterface(Dialect *dialect)
      : ConvertToLLVMPatternInterface(dialect) {}

  using ConvertToLLVMPatternInterface::ConvertToLLVMPatternInterface;
  // The conversion produces LLVM dialect ops, so that dialect must be loaded.
  void loadDependentDialects(MLIRContext *context) const final {
    context->loadDialect<LLVM::LLVMDialect>();
  }

  /// Hook for derived dialect interface to provide conversion patterns
  /// and mark dialect legal for the conversion target.
  void populateConvertToLLVMConversionPatterns(
      ConversionTarget &target, LLVMTypeConverter &typeConverter,
      RewritePatternSet &patterns) const final {
    // Uses the default values for the boolean lowering options.
    populateVectorToLLVMConversionPatterns(typeConverter, patterns);
  }
};
} // namespace
2253
2255 DialectRegistry &registry) {
2256 registry.addExtension(+[](MLIRContext *ctx, vector::VectorDialect *dialect) {
2257 dialect->addInterfaces<VectorToLLVMDialectInterface>();
2258 });
2259}
return success()
static Value getIndexedPtrs(ConversionPatternRewriter &rewriter, Location loc, const LLVMTypeConverter &typeConverter, MemRefType memRefType, Value llvmMemref, Value base, Value index, VectorType vectorType)
LogicalResult getVectorToLLVMAlignment(const LLVMTypeConverter &typeConverter, VectorType vectorType, MemRefType memrefType, unsigned &align, bool useVectorAlignment)
LogicalResult getVectorAlignment(const LLVMTypeConverter &typeConverter, VectorType vectorType, unsigned &align)
LogicalResult getMemRefAlignment(const LLVMTypeConverter &typeConverter, MemRefType memrefType, unsigned &align)
static Value extractOne(ConversionPatternRewriter &rewriter, const LLVMTypeConverter &typeConverter, Location loc, Value val, Type llvmType, int64_t rank, int64_t pos)
static Value insertOne(ConversionPatternRewriter &rewriter, const LLVMTypeConverter &typeConverter, Location loc, Value val1, Value val2, Type llvmType, int64_t rank, int64_t pos)
static Value getAsLLVMValue(OpBuilder &builder, Location loc, OpFoldResult foldResult)
Convert foldResult into a Value.
static LogicalResult isMemRefTypeSupported(MemRefType memRefType, const LLVMTypeConverter &converter)
LogicalResult initialize(unsigned origNumLoops, ArrayRef< ReassociationIndices > foldedIterationDims)
lhs
static Value broadcast(Location loc, Value toBroadcast, unsigned numElements, const TypeConverter &typeConverter, ConversionPatternRewriter &rewriter)
Broadcasts the value to vector with numElements number of elements.
static void printOp(llvm::raw_ostream &os, Operation *op, OpPrintingFlags &flags)
Definition Unit.cpp:18
#define mul(a, b)
static AffineMap get(MLIRContext *context)
Returns a zero result affine map with no dimensions or symbols: () -> ().
IntegerAttr getI32IntegerAttr(int32_t value)
Definition Builders.cpp:204
TypedAttr getZeroAttr(Type type)
Definition Builders.cpp:328
MLIRContext * getContext() const
Definition Builders.h:56
Utility class for operation conversions targeting the LLVM dialect that match exactly one source oper...
Definition Pattern.h:227
ConvertOpToLLVMPattern(const LLVMTypeConverter &typeConverter, PatternBenefit benefit=1)
Definition Pattern.h:233
static DenseElementsAttr get(ShapedType type, ArrayRef< Attribute > values)
Constructs a dense elements attribute from an array of element values.
The DialectRegistry maps a dialect namespace to a constructor for the matching dialect.
bool addExtension(TypeID extensionID, std::unique_ptr< DialectExtensionBase > extension)
Add the given extension to the registry.
Dialects are groups of MLIR operations, types and attributes, as well as behavior associated with the...
Definition Dialect.h:38
Conversion from types to the LLVM IR dialect.
const llvm::DataLayout & getDataLayout() const
Returns the data layout to use during and after conversion.
FailureOr< unsigned > getMemRefAddressSpace(BaseMemRefType type) const
Return the LLVM address space corresponding to the memory space of the memref type type or failure if...
LLVM::LLVMDialect * getDialect() const
Returns the LLVM dialect.
Utility class to translate MLIR LLVM dialect types to LLVM IR.
Definition TypeToLLVM.h:39
unsigned getPreferredAlignment(Type type, const llvm::DataLayout &layout)
Returns the preferred alignment for the type given the data layout.
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition Location.h:76
MLIRContext is the top-level object for a collection of MLIR operations.
Definition MLIRContext.h:63
Helper class to produce LLVM dialect operations extracting or inserting elements of a MemRef descript...
LLVM::LLVMPointerType getElementPtrType()
Returns the (LLVM) pointer type this descriptor contains.
Generic implementation of one-to-one conversion from "SourceOp" to "TargetOp" where the latter belong...
Definition Pattern.h:330
This class helps build Operations.
Definition Builders.h:209
This class represents a single result from folding an operation.
This class represents the benefit of a pattern match in a unitless scheme that ranges from 0 (very li...
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
MLIRContext * getContext() const
RewritePatternSet & add(ConstructorArg &&arg, ConstructorArgs &&...args)
Add an instance of each of the pattern types 'Ts' to the pattern list with the given arguments.
virtual void replaceOp(Operation *op, ValueRange newValues)
Replace the results of the given (original) operation with the specified list of values (replacements...
std::enable_if_t<!std::is_convertible< CallbackT, Twine >::value, LogicalResult > notifyMatchFailure(Location loc, CallbackT &&reasonCallback)
Used to notify the listener that the IR failed to be rewritten because of a match failure,...
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition Types.h:74
bool isIntOrIndex() const
Return true if this is an integer (of any signedness) or an index type.
Definition Types.cpp:114
bool isIntOrFloat() const
Return true if this is an integer (of any signedness) or a float type.
Definition Types.cpp:118
unsigned getIntOrFloatBitWidth() const
Return the bit width of an integer or a float type, assert failure on other types.
Definition Types.cpp:124
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition Value.h:96
Type getType() const
Return the type of this value.
Definition Value.h:105
Location getLoc() const
Return the location of this value.
Definition Value.cpp:24
void printType(Type type, AsmPrinter &printer)
Prints an LLVM Dialect type.
void nDVectorIterate(const NDVectorTypeInfo &info, OpBuilder &builder, function_ref< void(ArrayRef< int64_t >)> fun)
NDVectorTypeInfo extractNDVectorTypeInfo(VectorType vectorType, const LLVMTypeConverter &converter)
Value getStridedElementPtr(OpBuilder &builder, Location loc, const LLVMTypeConverter &converter, MemRefType type, Value memRefDesc, ValueRange indices, LLVM::GEPNoWrapFlags noWrapFlags=LLVM::GEPNoWrapFlags::none)
Performs the index computation to get to the element at indices of the memory pointed to by memRefDes...
Definition Pattern.cpp:603
Type getVectorType(Type elementType, unsigned numElements, bool isScalable=false)
Creates an LLVM dialect-compatible vector type with the given element type and length.
LLVM::FastmathFlags convertArithFastMathFlagsToLLVM(arith::FastMathFlags arithFMF)
Maps arithmetic fastmath enum values to LLVM enum values.
detail::InFlightRemark failed(Location loc, RemarkOpts opts)
Report an optimization remark that failed.
Definition Remarks.h:717
bool isReductionIterator(Attribute attr)
Returns true if attr has "reduction" iterator type semantics.
Definition VectorOps.h:156
void populateVectorContractToMatrixMultiply(RewritePatternSet &patterns, PatternBenefit benefit=100)
Populate the pattern set with the following patterns:
void populateVectorRankReducingFMAPattern(RewritePatternSet &patterns)
Populates a pattern that rank-reduces n-D FMAs into (n-1)-D FMAs where n > 1.
bool isParallelIterator(Attribute attr)
Returns true if attr has "parallel" iterator type semantics.
Definition VectorOps.h:151
void registerConvertVectorToLLVMInterface(DialectRegistry &registry)
SmallVector< int64_t > getAsIntegers(ArrayRef< Value > values)
Returns the integer numbers in values.
void populateVectorTransposeToFlatTranspose(RewritePatternSet &patterns, PatternBenefit benefit=100)
Populate the pattern set with the following patterns:
Value createReductionNeutralValue(OpBuilder &builder, Location loc, Type type, vector::CombiningKind kind)
Creates a constant filled with the neutral (identity) value for the given reduction kind.
Include the generated interface declarations.
SmallVector< OpFoldResult > getMixedValues(ArrayRef< int64_t > staticValues, ValueRange dynamicValues, MLIRContext *context)
Return a vector of OpFoldResults with the same size as staticValues, but where each element for which ShapedType::isDynamic is true is replaced by the corresponding entry of dynamicValues.
void bindDims(MLIRContext *ctx, AffineExprTy &...exprs)
Bind a list of AffineExpr references to DimExpr at positions: [0 .
Definition AffineExpr.h:311
Value getValueOrCreateCastToIndexLike(OpBuilder &b, Location loc, Type targetType, Value value)
Create a cast from an index-like value (index or integer) to another index-like value.
Definition Utils.cpp:122
Type getElementTypeOrSelf(Type type)
Return the element type or return the type itself.
void populateVectorToLLVMConversionPatterns(const LLVMTypeConverter &converter, RewritePatternSet &patterns, bool reassociateFPReductions=false, bool force32BitVectorIndices=false, bool useVectorAlignment=false)
Collect a set of patterns to convert from the Vector dialect to LLVM.
OpRewritePattern is a wrapper around RewritePattern that allows for matching and rewriting against an...
A pattern for ops that implement MaskableOpInterface and that might be masked (i.e.