//===- BufferizableOpInterfaceImpl.cpp - Impl. of BufferizableOpInterface -===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "mlir/Dialect/Tensor/Transforms/BufferizableOpInterfaceImpl.h"

#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Bufferization/IR/BufferizableOpInterface.h"
#include "mlir/Dialect/Bufferization/IR/Bufferization.h"
#include "mlir/Dialect/Bufferization/IR/DstBufferizableOpInterfaceImpl.h"
#include "mlir/Dialect/Linalg/IR/Linalg.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/Tensor/IR/Tensor.h"
#include "mlir/Dialect/Utils/StaticValueUtils.h"
#include "mlir/IR/Dialect.h"
#include "mlir/IR/Operation.h"

using namespace mlir;
using namespace mlir::bufferization;
using namespace mlir::tensor;

namespace mlir {
namespace tensor {
namespace {

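/// Bufferization of tensor.cast. Replace with memref.cast, or fold away when
/// source and result bufferize to the same memref type.
///
/// Illustrative sketch (assumed IR, memory spaces and layouts simplified):
/// ```
/// %1 = tensor.cast %0 : tensor<?xf32> to tensor<4xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %m1 = memref.cast %m0 : memref<?xf32> to memref<4xf32>
/// ```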
struct CastOpInterface
    : public BufferizableOpInterface::ExternalModel<CastOpInterface,
                                                    tensor::CastOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return false;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {{op->getResult(0), BufferRelation::Equivalent}};
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    auto castOp = cast<tensor::CastOp>(op);
    auto maybeSrcBufferType =
        bufferization::detail::asMemRefType(bufferization::getBufferType(
            castOp.getSource(), options, state, invocationStack));
    if (failed(maybeSrcBufferType))
      return failure();
    Attribute memorySpace = maybeSrcBufferType->getMemorySpace();

    // Note: `getMemRefTypeWithFullyDynamicLayout` returns an unranked memref
    // type in case the input is an unranked tensor type.

    // Case 1: Casting an unranked tensor.
    if (isa<UnrankedTensorType>(castOp.getSource().getType())) {
      // When casting to a ranked tensor, we cannot infer any static offset or
      // strides from the source. Assume fully dynamic.
      return cast<BufferLikeType>(
          getMemRefTypeWithFullyDynamicLayout(castOp.getType(), memorySpace));
    }

    // Case 2: Casting to an unranked tensor type.
    if (isa<UnrankedTensorType>(castOp.getType())) {
      return cast<BufferLikeType>(
          getMemRefTypeWithFullyDynamicLayout(castOp.getType(), memorySpace));
    }

    // Case 3: Ranked tensor -> ranked tensor. The offsets and strides do not
    // change.
    auto rankedResultType = cast<RankedTensorType>(castOp.getType());
    return cast<BufferLikeType>(MemRefType::get(
        rankedResultType.getShape(), rankedResultType.getElementType(),
        llvm::cast<MemRefType>(*maybeSrcBufferType).getLayout(), memorySpace));
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto castOp = cast<tensor::CastOp>(op);

    // The result buffer still has the old (pre-cast) type.
    FailureOr<Value> resultBuffer =
        getBuffer(rewriter, castOp.getSource(), options, state);
    if (failed(resultBuffer))
      return failure();

    // Compute the new type.
    auto resultMemRefType =
        bufferization::getBufferType(castOp.getResult(), options, state);
    if (failed(resultMemRefType))
      return failure();
    if (resultBuffer->getType() == *resultMemRefType) {
      // This cast is a no-op.
      replaceOpWithBufferizedValues(rewriter, op, *resultBuffer);
      return success();
    }

    // Replace the op with a memref.cast.
    assert(memref::CastOp::areCastCompatible(resultBuffer->getType(),
                                             *resultMemRefType) &&
           "CastOp::bufferize: cast incompatible");
    replaceOpWithNewBufferizedOp<memref::CastOp>(
        rewriter, op, *resultMemRefType, *resultBuffer);

    return success();
  }
};

/// Bufferization of tensor.collapse_shape. Replace with memref.collapse_shape.
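///
/// Illustrative sketch (assumed IR; if the source layout is not collapsible,
/// a copy into an identity-layout buffer is inserted first):
/// ```
/// %1 = tensor.collapse_shape %0 [[0, 1]]
///     : tensor<2x3xf32> into tensor<6xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %m1 = memref.collapse_shape %m0 [[0, 1]]
///     : memref<2x3xf32> into memref<6xf32>
/// ```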
struct CollapseShapeOpInterface
    : public BufferizableOpInterface::ExternalModel<CollapseShapeOpInterface,
                                                    tensor::CollapseShapeOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    // tensor.collapse_shape may reallocate, at which point the source buffer
    // is copied. I.e., there will be a memory read side effect on the
    // bufferized source. This function conservatively returns "true" because
    // whether a copy will be created or not is not known at this point.
    return true;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    // TODO: CollapseShapeOp may allocate at runtime.
    return {{op->getOpResult(0), BufferRelation::Equivalent}};
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    auto collapseShapeOp = cast<tensor::CollapseShapeOp>(op);
    auto maybeSrcBufferType = bufferization::getBufferType(
        collapseShapeOp.getSrc(), options, state, invocationStack);
    if (failed(maybeSrcBufferType))
      return failure();
    auto srcBufferType = llvm::cast<MemRefType>(*maybeSrcBufferType);
    bool canBeCollapsed = memref::CollapseShapeOp::isGuaranteedCollapsible(
        srcBufferType, collapseShapeOp.getReassociationIndices());

    if (!canBeCollapsed) {
      // If dims cannot be collapsed, this op bufferizes to a new allocation.
      RankedTensorType tensorResultType = collapseShapeOp.getResultType();
      return cast<BufferLikeType>(
          bufferization::getMemRefTypeWithStaticIdentityLayout(
              tensorResultType, srcBufferType.getMemorySpace()));
    }

    return cast<BufferLikeType>(memref::CollapseShapeOp::computeCollapsedType(
        srcBufferType, collapseShapeOp.getReassociationIndices()));
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto collapseShapeOp = cast<tensor::CollapseShapeOp>(op);
    RankedTensorType tensorResultType = collapseShapeOp.getResultType();
    FailureOr<Value> maybeBuffer =
        getBuffer(rewriter, collapseShapeOp.getSrc(), options, state);
    if (failed(maybeBuffer))
      return failure();
    Value buffer = *maybeBuffer;
    auto bufferType = cast<MemRefType>(buffer.getType());

    if (tensorResultType.getRank() == 0) {
      // 0-d collapses must go through a different op builder.
      MemRefType resultType;

      if (bufferType.getLayout().isIdentity()) {
        // Standard layout: result type has no offset.
        MemRefLayoutAttrInterface layout;
        resultType = MemRefType::get({}, tensorResultType.getElementType(),
                                     layout, bufferType.getMemorySpace());
      } else {
        // Source memref has a layout map: result type has the same offset as
        // the source type.
        SmallVector<int64_t> strides;
        int64_t offset;
        if (failed(bufferType.getStridesAndOffset(strides, offset)))
          return failure();
        resultType = MemRefType::get(
            {}, tensorResultType.getElementType(),
            StridedLayoutAttr::get(op->getContext(), offset, {}),
            bufferType.getMemorySpace());
      }

      replaceOpWithNewBufferizedOp<memref::CollapseShapeOp>(
          rewriter, op, resultType, buffer, collapseShapeOp.getReassociation());
      return success();
    }

    // If the dims are not collapsible (due to an incompatible source layout
    // map), force an out-of-place bufferization, i.e., a buffer copy. This
    // newly allocated buffer will have no layout map and thus be collapsible.
    bool canBeCollapsed = memref::CollapseShapeOp::isGuaranteedCollapsible(
        bufferType, collapseShapeOp.getReassociationIndices());
    if (!canBeCollapsed) {
      // TODO: Create alloc_tensor ops during TensorCopyInsertion.
      AnalysisState analysisState(options);
      FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
          rewriter, op->getLoc(), collapseShapeOp.getSrc(), options, state);
      if (failed(tensorAlloc))
        return failure();
      auto memrefType =
          MemRefType::get(collapseShapeOp.getSrcType().getShape(),
                          collapseShapeOp.getSrcType().getElementType(),
                          AffineMap(), bufferType.getMemorySpace());
      buffer = bufferization::ToBufferOp::create(rewriter, op->getLoc(),
                                                 memrefType, *tensorAlloc);
    }

    // Result type is inferred by the builder.
    replaceOpWithNewBufferizedOp<memref::CollapseShapeOp>(
        rewriter, op, buffer, collapseShapeOp.getReassociationIndices());
    return success();
  }
};

/// Bufferization of tensor.dim. Replace with memref.dim.
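///
/// Illustrative sketch (assumed IR):
/// ```
/// %d = tensor.dim %t, %c0 : tensor<?xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %d = memref.dim %m, %c0 : memref<?xf32>
/// ```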
struct DimOpInterface
    : public BufferizableOpInterface::ExternalModel<DimOpInterface,
                                                    tensor::DimOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    // The op reads the tensor's metadata but not its contents.
    return false;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto dimOp = cast<tensor::DimOp>(op);
    FailureOr<Value> v = getBuffer(rewriter, dimOp.getSource(), options, state);
    if (failed(v))
      return failure();
    replaceOpWithNewBufferizedOp<memref::DimOp>(rewriter, op, *v,
                                                dimOp.getIndex());
    return success();
  }
};

/// Bufferization of "tensor.empty". Replace with "bufferization.alloc_tensor".
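///
/// Illustrative sketch (assumed IR):
/// ```
/// %0 = tensor.empty() : tensor<4xf32>
/// ```
/// is rewritten to:
/// ```
/// %0 = bufferization.alloc_tensor() : tensor<4xf32>
/// ```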
struct EmptyOpInterface
    : public BufferizableOpInterface::ExternalModel<EmptyOpInterface,
                                                    tensor::EmptyOp> {
  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  bool resultBufferizesToMemoryWrite(Operation *op, OpResult opResult,
                                     const AnalysisState &state) const {
    // The returned tensor does not have specified contents.
    return false;
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto emptyOp = cast<tensor::EmptyOp>(op);

    // Optimization: Fold away the op if it has no uses.
    if (op->getUses().empty()) {
      rewriter.eraseOp(op);
      return success();
    }

    // Allocate a tensor. This emits a "bufferization.alloc_tensor" op.
    FailureOr<Value> allocTensor = allocateTensorForShapedValue(
        rewriter, op->getLoc(), emptyOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(allocTensor))
      return failure();
    rewriter.replaceOp(op, *allocTensor);
    return success();
  }
};

/// Bufferization of tensor.expand_shape. Replace with memref.expand_shape.
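///
/// Illustrative sketch (assumed IR; exact output_shape syntax simplified):
/// ```
/// %1 = tensor.expand_shape %0 [[0, 1]] output_shape [2, 3]
///     : tensor<6xf32> into tensor<2x3xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %m1 = memref.expand_shape %m0 [[0, 1]] output_shape [2, 3]
///     : memref<6xf32> into memref<2x3xf32>
/// ```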
struct ExpandShapeOpInterface
    : public BufferizableOpInterface::ExternalModel<ExpandShapeOpInterface,
                                                    tensor::ExpandShapeOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    // In contrast to tensor.collapse_shape, this op can always be bufferized
    // without a copy.
    return false;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {{op->getOpResult(0), BufferRelation::Equivalent}};
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    auto expandShapeOp = cast<tensor::ExpandShapeOp>(op);
    auto maybeSrcBufferType = bufferization::getBufferType(
        expandShapeOp.getSrc(), options, state, invocationStack);
    if (failed(maybeSrcBufferType))
      return failure();
    auto srcBufferType = llvm::cast<MemRefType>(*maybeSrcBufferType);
    auto maybeResultType = memref::ExpandShapeOp::computeExpandedType(
        srcBufferType, expandShapeOp.getResultType().getShape(),
        expandShapeOp.getReassociationIndices());
    if (failed(maybeResultType))
      return failure();
    return cast<BufferLikeType>(*maybeResultType);
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto expandShapeOp = cast<tensor::ExpandShapeOp>(op);
    auto tensorResultType = expandShapeOp.getResultType();
    FailureOr<Value> buffer =
        getBuffer(rewriter, expandShapeOp.getSrc(), options, state);
    if (failed(buffer))
      return failure();

    auto memrefExpandShape = memref::ExpandShapeOp::create(
        rewriter, op->getLoc(), tensorResultType.getShape(), *buffer,
        expandShapeOp.getReassociationIndices(),
        expandShapeOp.getMixedOutputShape());
    replaceOpWithBufferizedValues(rewriter, op,
                                  memrefExpandShape->getResults());
    return success();
  }
};

/// Bufferization of tensor.extract_slice. Replace with memref.subview.
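///
/// Illustrative sketch (assumed IR; the subview result carries a strided
/// layout):
/// ```
/// %1 = tensor.extract_slice %0[4][8][1] : tensor<16xf32> to tensor<8xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %m1 = memref.subview %m0[4][8][1]
///     : memref<16xf32> to memref<8xf32, strided<[1], offset: 4>>
/// ```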
struct ExtractSliceOpInterface
    : public BufferizableOpInterface::ExternalModel<ExtractSliceOpInterface,
                                                    tensor::ExtractSliceOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return false;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {{op->getOpResult(0), BufferRelation::Unknown}};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto extractSliceOp = cast<tensor::ExtractSliceOp>(op);
    SmallVector<OpFoldResult> mixedOffsets = extractSliceOp.getMixedOffsets();
    SmallVector<OpFoldResult> mixedSizes = extractSliceOp.getMixedSizes();
    SmallVector<OpFoldResult> mixedStrides = extractSliceOp.getMixedStrides();
    Location loc = extractSliceOp.getLoc();

    // Get source buffer.
    FailureOr<Value> srcMemref =
        getBuffer(rewriter, extractSliceOp.getSource(), options, state);
    if (failed(srcMemref))
      return failure();

    // Take a subview of the source buffer.
    auto resultMemrefType = bufferization::getBufferType(
        extractSliceOp.getResult(), options, state);
    if (failed(resultMemrefType))
      return failure();
    Value subView = memref::SubViewOp::create(
        rewriter, loc, llvm::cast<MemRefType>(*resultMemrefType), *srcMemref,
        mixedOffsets, mixedSizes, mixedStrides);

    replaceOpWithBufferizedValues(rewriter, op, subView);
    return success();
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    auto extractSliceOp = cast<tensor::ExtractSliceOp>(op);
    assert(value == extractSliceOp.getResult() && "invalid value");
    auto srcMemrefType = bufferization::getBufferType(
        extractSliceOp.getSource(), options, state, invocationStack);
    if (failed(srcMemrefType))
      return failure();
    SmallVector<OpFoldResult> mixedOffsets = extractSliceOp.getMixedOffsets();
    SmallVector<OpFoldResult> mixedSizes = extractSliceOp.getMixedSizes();
    SmallVector<OpFoldResult> mixedStrides = extractSliceOp.getMixedStrides();
    return cast<BufferLikeType>(memref::SubViewOp::inferRankReducedResultType(
        extractSliceOp.getType().getShape(),
        llvm::cast<MemRefType>(*srcMemrefType), mixedOffsets, mixedSizes,
        mixedStrides));
  }
};

/// Bufferization of tensor.extract. Replace with memref.load.
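///
/// Illustrative sketch (assumed IR):
/// ```
/// %v = tensor.extract %t[%i] : tensor<?xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %v = memref.load %m[%i] : memref<?xf32>
/// ```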
struct ExtractOpInterface
    : public BufferizableOpInterface::ExternalModel<ExtractOpInterface,
                                                    tensor::ExtractOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return true;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto extractOp = cast<tensor::ExtractOp>(op);
    FailureOr<Value> srcMemref =
        getBuffer(rewriter, extractOp.getTensor(), options, state);
    if (failed(srcMemref))
      return failure();
    replaceOpWithNewBufferizedOp<memref::LoadOp>(rewriter, op, *srcMemref,
                                                 extractOp.getIndices());
    return success();
  }
};

// Implements backtracking to traverse indices of the output buffer while
// iterating over op.elements().
static void createStores(RewriterBase &rewriter, Location loc, int dim,
                         Value buffer, ArrayRef<int64_t> shape,
                         ArrayRef<Value> constants,
                         OperandRange::iterator &elementIt,
                         SmallVectorImpl<Value> &indices) {
  if (dim == static_cast<int>(shape.size()) - 1) {
    for (int i = 0; i < shape.back(); ++i) {
      indices.back() = constants[i];
      memref::StoreOp::create(rewriter, loc, *elementIt, buffer, indices);
      ++elementIt;
    }
    return;
  }
  for (int i = 0; i < shape[dim]; ++i) {
    indices[dim] = constants[i];
    createStores(rewriter, loc, dim + 1, buffer, shape, constants, elementIt,
                 indices);
  }
}

/// Bufferization of tensor.from_elements.
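///
/// Illustrative sketch (assumed IR): the result is materialized into a new
/// allocation with one memref.store per element.
/// ```
/// %0 = tensor.from_elements %a, %b : tensor<2xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %alloc = memref.alloc() : memref<2xf32>
/// memref.store %a, %alloc[%c0] : memref<2xf32>
/// memref.store %b, %alloc[%c1] : memref<2xf32>
/// ```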
struct FromElementsOpInterface
    : public BufferizableOpInterface::ExternalModel<FromElementsOpInterface,
                                                    tensor::FromElementsOp> {

  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto fromElementsOp = cast<tensor::FromElementsOp>(op);
    auto tensorType = cast<RankedTensorType>(fromElementsOp.getType());

    // Allocate a buffer for the result.
    Location loc = op->getLoc();
    auto shape = tensorType.getShape();
    // TODO: Create alloc_tensor ops during TensorCopyInsertion.
    FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
        rewriter, loc, fromElementsOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(tensorAlloc))
      return failure();
    FailureOr<BufferLikeType> memrefType =
        bufferization::getBufferType(*tensorAlloc, options, state);
    if (failed(memrefType))
      return failure();
    Value buffer = bufferization::ToBufferOp::create(rewriter, op->getLoc(),
                                                     *memrefType, *tensorAlloc);

    // Case: tensor<0xelem_type>.
    if (fromElementsOp.getElements().empty()) {
      replaceOpWithBufferizedValues(rewriter, op, buffer);
      return success();
    }

    // Case: tensor<elem_type>.
    if (shape.empty()) {
      memref::StoreOp::create(rewriter, loc,
                              fromElementsOp.getElements().front(), buffer);
      replaceOpWithBufferizedValues(rewriter, op, buffer);
      return success();
    }

    // Create constants for the range of possible indices [0, max{shape_i}).
    auto maxDim = *llvm::max_element(shape);
    SmallVector<Value, 2> constants;
    constants.reserve(maxDim);
    for (int i = 0; i < maxDim; ++i)
      constants.push_back(arith::ConstantIndexOp::create(rewriter, loc, i));

    // Traverse all `elements` and create `memref.store` ops.
    auto elementIt = fromElementsOp.getElements().begin();
    SmallVector<Value, 2> indices(tensorType.getRank(), constants[0]);
    createStores(rewriter, loc, /*dim=*/0, buffer, shape, constants, elementIt,
                 indices);

    replaceOpWithBufferizedValues(rewriter, op, buffer);

    return success();
  }
};

/// Lower the body of a tensor.generate-like op (one index-typed bbArg per
/// dim). Such ops are lowered to linalg.map with the given tensor as a
/// destination.
///
/// Example:
/// ```
/// %r = tensor.generate %x, %y {
///   ^bb0(%arg0: index, %arg1: index):
///   %0 = "some_op"(%arg0, %arg1) : (index, index) -> (index)
///   tensor.yield %0 : index
/// } : tensor<?x?xindex>
/// ```
///
/// Is lowered to:
/// ```
/// linalg.map ins() outs(%dest) {
///   %d0 = linalg.index 0 : index
///   %d1 = linalg.index 1 : index
///   %0 = "some_op"(%d0, %d1) : (index, index) -> (index)
///   linalg.yield %0 : index
/// }
/// ```
static Value lowerGenerateLikeOpBody(RewriterBase &rewriter, Location loc,
                                     Value tensorDestination,
                                     ValueRange dynamicSizes,
                                     Region &generateBody) {
  assert(generateBody.hasOneBlock() && "expected body with single block");
  auto tensorType = cast<RankedTensorType>(tensorDestination.getType());
  assert(generateBody.getNumArguments() == tensorType.getRank() &&
         "rank mismatch");

  // Create linalg::MapOp.
  OpBuilder::InsertionGuard g(rewriter);
  auto linalgOp =
      linalg::MapOp::create(rewriter, loc, tensorType, /*inputs=*/ValueRange(),
                            /*init=*/tensorDestination);
  Block &linalgBody = linalgOp.getMapper().emplaceBlock();
  linalgBody.addArgument(tensorType.getElementType(), loc);

  // Create linalg::IndexOps.
  rewriter.setInsertionPointToStart(&linalgBody);
  SmallVector<Value> indices;
  for (int64_t dim = 0; dim < tensorType.getRank(); ++dim)
    indices.push_back(linalg::IndexOp::create(rewriter, loc, dim));

  // Move over body.
  rewriter.mergeBlocks(&generateBody.front(), &linalgBody, indices);
  auto yieldOp = cast<tensor::YieldOp>(linalgBody.getTerminator());
  rewriter.replaceOpWithNewOp<linalg::YieldOp>(yieldOp, yieldOp.getValue());

  return linalgOp.getResult()[0];
}

/// Bufferization of tensor.generate.
struct GenerateOpInterface
    : public BufferizableOpInterface::ExternalModel<GenerateOpInterface,
                                                    tensor::GenerateOp> {

  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto generateOp = cast<tensor::GenerateOp>(op);

    auto type = generateOp.getResult().getType();

    // TODO: Implement memory space for this op.
    if (options.defaultMemorySpaceFn(type) != Attribute())
      return op->emitError("memory space not implemented yet");

    // Allocate memory.
    Location loc = op->getLoc();
    FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
        rewriter, loc, generateOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(tensorAlloc))
      return failure();

    Value result = lowerGenerateLikeOpBody(rewriter, loc, *tensorAlloc,
                                           generateOp.getDynamicExtents(),
                                           generateOp.getBody());
    rewriter.replaceOp(generateOp, result);

    return success();
  }
};

/// Bufferization of tensor.insert. Replace with memref.store.
///
/// Note: DstBufferizableOpInterfaceExternalModel provides many default method
/// implementations for DestinationStyle ops.
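///
/// Illustrative sketch (assumed IR):
/// ```
/// %1 = tensor.insert %v into %t[%i] : tensor<?xf32>
/// ```
/// bufferizes roughly to a store into the destination buffer:
/// ```
/// memref.store %v, %m[%i] : memref<?xf32>
/// ```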
struct InsertOpInterface
    : public DstBufferizableOpInterfaceExternalModel<InsertOpInterface,
                                                     tensor::InsertOp> {
  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto insertOp = cast<tensor::InsertOp>(op);
    FailureOr<Value> destMemref =
        getBuffer(rewriter, insertOp.getDest(), options, state);
    if (failed(destMemref))
      return failure();
    memref::StoreOp::create(rewriter, insertOp.getLoc(), insertOp.getScalar(),
                            *destMemref, insertOp.getIndices());
    replaceOpWithBufferizedValues(rewriter, op, *destMemref);
    return success();
  }
};

template <typename InsertOpTy>
static bool insertSliceOpRequiresRead(InsertOpTy insertSliceOp,
                                      OpOperand &opOperand) {
  // The source is always read.
  if (opOperand == insertSliceOp.getSourceMutable())
    return true;

  // For the destination, it depends...
  assert(opOperand == insertSliceOp.getDestMutable() && "expected dest");

  // Dest is not read if it is entirely overwritten. E.g.:
  // tensor.insert_slice %a into %t[0][10][1] : ... into tensor<10xf32>
  bool allOffsetsZero =
      llvm::all_of(insertSliceOp.getMixedOffsets(), isZeroInteger);
  RankedTensorType destType = insertSliceOp.getDestType();
  bool sizesMatchDestSizes =
      areConstantIntValues(insertSliceOp.getMixedSizes(), destType.getShape());
  bool allStridesOne =
      areAllConstantIntValue(insertSliceOp.getMixedStrides(), 1);
  return !(allOffsetsZero && sizesMatchDestSizes && allStridesOne);
}

/// Bufferization of tensor.insert_slice. Replace with a memory copy. Under
/// certain circumstances, this op can also be a no-op.
///
/// Note: DstBufferizableOpInterfaceExternalModel provides many default method
/// implementations for DestinationStyle ops.
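///
/// Illustrative sketch (assumed IR; the copy folds away if the slice
/// bufferizes in-place with a matching extract_slice):
/// ```
/// %1 = tensor.insert_slice %src into %dst[4][8][1]
///     : tensor<8xf32> into tensor<16xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %sv = memref.subview %m_dst[4][8][1]
///     : memref<16xf32> to memref<8xf32, strided<[1], offset: 4>>
/// memref.copy %m_src, %sv
///     : memref<8xf32> to memref<8xf32, strided<[1], offset: 4>>
/// ```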
struct InsertSliceOpInterface
    : public DstBufferizableOpInterfaceExternalModel<InsertSliceOpInterface,
                                                     tensor::InsertSliceOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return insertSliceOpRequiresRead(cast<tensor::InsertSliceOp>(op),
                                     opOperand);
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    // insert_slice ops arise from tiling and bufferizing them out-of-place is
    // generally a deal breaker. When used with loops, this ends up cloning the
    // whole tensor on every single iteration and is a symptom of a
    // catastrophically bad scheduling decision.
    // TODO: be very loud about it or even consider failing the pass.
    auto insertSliceOp = cast<tensor::InsertSliceOp>(op);
    SmallVector<OpFoldResult> mixedOffsets = insertSliceOp.getMixedOffsets();
    SmallVector<OpFoldResult> mixedSizes = insertSliceOp.getMixedSizes();
    SmallVector<OpFoldResult> mixedStrides = insertSliceOp.getMixedStrides();
    Location loc = insertSliceOp.getLoc();

    // Get destination buffer.
    FailureOr<Value> dstMemref =
        getBuffer(rewriter, insertSliceOp.getDest(), options, state);
    if (failed(dstMemref))
      return failure();

    // Take a subview of the destination buffer.
    auto dstMemrefType = cast<MemRefType>(dstMemref->getType());
    MemRefType subviewMemRefType =
        memref::SubViewOp::inferRankReducedResultType(
            insertSliceOp.getSourceType().getShape(), dstMemrefType,
            mixedOffsets, mixedSizes, mixedStrides);
    Value subView =
        memref::SubViewOp::create(rewriter, loc, subviewMemRefType, *dstMemref,
                                  mixedOffsets, mixedSizes, mixedStrides);

    // Copy tensor. If this tensor.insert_slice has a matching
    // tensor.extract_slice, the copy operation will eventually fold away.
    FailureOr<Value> srcMemref =
        getBuffer(rewriter, insertSliceOp.getSource(), options, state);
    if (failed(srcMemref))
      return failure();
    if (failed(options.createMemCpy(rewriter, loc, *srcMemref, subView)))
      return failure();

    replaceOpWithBufferizedValues(rewriter, op, *dstMemref);
    return success();
  }
};

/// Bufferization of tensor.pad. Replace with bufferization.alloc_tensor +
/// linalg.map + insert_slice.
/// For best performance, vectorize before bufferization; this is particularly
/// beneficial when padding with a constant.
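///
/// Illustrative sketch (assumed IR, static shapes for brevity):
/// ```
/// %1 = tensor.pad %0 low[1] high[1] {
/// ^bb0(%i: index):
///   tensor.yield %cst : f32
/// } : tensor<6xf32> to tensor<8xf32>
/// ```
/// bufferizes roughly to an 8-element allocation that is first filled with
/// %cst via linalg.map and into which %0 is then inserted at offset 1 via
/// tensor.insert_slice (which itself lowers to a subview plus a copy).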
struct PadOpInterface
    : public BufferizableOpInterface::ExternalModel<PadOpInterface,
                                                    tensor::PadOp> {
  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return true;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    // Infer memory space from the source tensor.
    auto padOp = cast<tensor::PadOp>(op);
    auto maybeSrcBufferType =
        bufferization::detail::asMemRefType(bufferization::getBufferType(
            padOp.getSource(), options, state, invocationStack));
    if (failed(maybeSrcBufferType))
      return failure();
    MemRefLayoutAttrInterface layout;
    return cast<BufferLikeType>(
        MemRefType::get(padOp.getResultType().getShape(),
                        padOp.getResultType().getElementType(), layout,
                        maybeSrcBufferType->getMemorySpace()));
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto padOp = cast<tensor::PadOp>(op);
    Location loc = padOp.getLoc();
    RankedTensorType resultType = padOp.getResultType();
    RankedTensorType srcType = padOp.getSourceType();

    auto toValue = [&](OpFoldResult ofr) {
      if (auto value = dyn_cast<Value>(ofr))
        return value;
      return arith::ConstantIndexOp::create(rewriter, loc,
                                            *getConstantIntValue(ofr))
          .getResult();
    };

    // Compute dynamic result dimensions.
    SmallVector<OpFoldResult> mixedLowPad = padOp.getMixedLowPad();
    SmallVector<OpFoldResult> mixedHighPad = padOp.getMixedHighPad();
    SmallVector<Value> dynamicSizes;
    for (int64_t i = 0; i < resultType.getRank(); ++i) {
      if (!resultType.isDynamicDim(i))
        continue;
      Value srcDim = tensor::DimOp::create(rewriter, loc, padOp.getSource(), i);
      Value lowPad = toValue(mixedLowPad[i]);
      Value highPad = toValue(mixedHighPad[i]);
      AffineExpr s0, s1, s2;
      bindSymbols(op->getContext(), s0, s1, s2);
      AffineExpr sumExpr = s0 + s1 + s2;
      Value sum = affine::AffineApplyOp::create(
          rewriter, loc, sumExpr, ValueRange{srcDim, lowPad, highPad});
      dynamicSizes.push_back(sum);
    }

    // Allocate a buffer for the padded result.
    FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
        rewriter, loc, padOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(tensorAlloc))
      return failure();

    // tensor::PadOp is like tensor::GenerateOp: The only difference is that
    // only a part of the generated tensor is needed. For simplicity, we reuse
    // the same functionality here.
    Value filledBuffer = lowerGenerateLikeOpBody(
        rewriter, loc, *tensorAlloc, dynamicSizes, padOp.getBodyRegion());

    // Create tensor::InsertSliceOp.
    SmallVector<OpFoldResult> sliceSizes =
        getMixedSizes(rewriter, loc, padOp.getSource());
    SmallVector<OpFoldResult> sliceStrides(srcType.getRank(),
                                           rewriter.getIndexAttr(1));
    rewriter.replaceOpWithNewOp<tensor::InsertSliceOp>(
        padOp, padOp.getSource(), filledBuffer,
        /*offsets=*/padOp.getMixedLowPad(), sliceSizes, sliceStrides);

    return success();
  }
};

/// Bufferization of tensor.rank. Replace with memref.rank.
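///
/// Illustrative sketch (assumed IR):
/// ```
/// %r = tensor.rank %t : tensor<*xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %r = memref.rank %m : memref<*xf32>
/// ```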
struct RankOpInterface
    : public BufferizableOpInterface::ExternalModel<RankOpInterface,
                                                    tensor::RankOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    // The op reads the tensor's metadata but not its contents.
    return false;
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto rankOp = cast<tensor::RankOp>(op);
    FailureOr<Value> v =
        getBuffer(rewriter, rankOp.getTensor(), options, state);
    if (failed(v))
      return failure();
    replaceOpWithNewBufferizedOp<memref::RankOp>(rewriter, op, rankOp.getType(),
                                                 *v);
    return success();
  }
};

/// Bufferization of tensor.reshape. Replace with memref.reshape.
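///
/// Illustrative sketch (assumed IR; the source is copied first if its layout
/// is not an identity layout):
/// ```
/// %1 = tensor.reshape %0(%shape)
///     : (tensor<?x?xf32>, tensor<2xindex>) -> tensor<?x?xf32>
/// ```
/// bufferizes roughly to:
/// ```
/// %m1 = memref.reshape %m0(%mshape)
///     : (memref<?x?xf32>, memref<2xindex>) -> memref<?x?xf32>
/// ```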
struct ReshapeOpInterface
    : public BufferizableOpInterface::ExternalModel<ReshapeOpInterface,
                                                    tensor::ReshapeOp> {
  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    // Depending on the layout map, the source buffer may have to be copied.
    auto reshapeOp = cast<tensor::ReshapeOp>(op);
    return opOperand == reshapeOp.getShapeMutable();
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    // Only the 'source' operand aliases the result.
    auto reshapeOp = cast<tensor::ReshapeOp>(op);
    if (reshapeOp.getSourceMutable() != opOperand)
      return {};
    return {{op->getOpResult(0), BufferRelation::Equivalent}};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    auto reshapeOp = cast<tensor::ReshapeOp>(op);
    FailureOr<Value> srcBuffer =
        getBuffer(rewriter, reshapeOp.getSource(), options, state);
    FailureOr<Value> shapeBuffer =
        getBuffer(rewriter, reshapeOp.getShape(), options, state);
    if (failed(srcBuffer) || failed(shapeBuffer))
      return failure();
    auto maybeResultMemRefType =
        bufferization::getBufferType(reshapeOp.getResult(), options, state);
    if (failed(maybeResultMemRefType))
      return failure();

    // memref.reshape requires the source buffer to have an identity layout.
    // If the source memref does not have an identity layout, copy the source
    // into a new buffer with an identity layout.
    auto srcType = llvm::dyn_cast<MemRefType>(srcBuffer->getType());
    if (srcType && !srcType.getLayout().isIdentity()) {
      FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
          rewriter, op->getLoc(), reshapeOp.getSource(), options, state);
      if (failed(tensorAlloc))
        return failure();
      auto memrefType = MemRefType::get(
          srcType.getShape(), srcType.getElementType(), AffineMap(),
          cast<BaseMemRefType>(srcBuffer->getType()).getMemorySpace());
      srcBuffer = bufferization::ToBufferOp::create(rewriter, op->getLoc(),
                                                    memrefType, *tensorAlloc)
                      .getResult();
    }

    replaceOpWithNewBufferizedOp<memref::ReshapeOp>(
        rewriter, op, maybeResultMemRefType.value(), *srcBuffer, *shapeBuffer);
    return success();
  }

  FailureOr<BufferLikeType>
  getBufferType(Operation *op, Value value, const BufferizationOptions &options,
                const BufferizationState &state,
                SmallVector<Value> &invocationStack) const {
    auto reshapeOp = cast<tensor::ReshapeOp>(op);
    assert(value == reshapeOp.getResult() && "unexpected value provided");
    auto maybeSourceBufferType = bufferization::getBufferType(
        reshapeOp.getSource(), options, state, invocationStack);
    if (failed(maybeSourceBufferType))
      return failure();
    return cast<BufferLikeType>(getMemRefTypeWithStaticIdentityLayout(
        reshapeOp.getResult().getType(),
        cast<BaseMemRefType>(maybeSourceBufferType.value()).getMemorySpace()));
  }
};

/// Analysis of ParallelInsertSliceOp.
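///
/// Illustrative sketch (assumed IR): inside the terminator of an scf.forall,
/// ```
/// scf.forall.in_parallel {
///   tensor.parallel_insert_slice %src into %dst[%off][8][1]
///       : tensor<8xf32> into tensor<64xf32>
/// }
/// ```
/// bufferizes roughly to a memref.subview of the destination buffer plus a
/// memref.copy, emitted just before the in_parallel terminator.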
struct ParallelInsertSliceOpInterface
    : public BufferizableOpInterface::ExternalModel<
          ParallelInsertSliceOpInterface, ParallelInsertSliceOp> {
  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return opOperand == cast<ParallelInsertSliceOp>(op).getSourceMutable();
  }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    auto parallelInsertSliceOp = cast<ParallelInsertSliceOp>(op);
    return opOperand == parallelInsertSliceOp.getDestMutable();
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    OpBuilder::InsertionGuard g(rewriter);
    auto parallelInsertSliceOp = cast<ParallelInsertSliceOp>(op);
    InParallelOpInterface parallelCombiningParent =
        parallelInsertSliceOp.getParallelCombiningParent();

    // Bufferize the op outside of the in parallel terminator.
    rewriter.setInsertionPoint(parallelCombiningParent);

    // Get source and destination buffers.
    FailureOr<Value> destBuffer =
        getBuffer(rewriter, parallelInsertSliceOp.getDest(), options, state);
    if (failed(destBuffer))
      return failure();
    FailureOr<Value> srcBuffer =
        getBuffer(rewriter, parallelInsertSliceOp.getSource(), options, state);
    if (failed(srcBuffer))
      return failure();

    // Take a subview of the destination buffer.
    auto destBufferType = cast<MemRefType>(destBuffer->getType());
    MemRefType subviewMemRefType =
        memref::SubViewOp::inferRankReducedResultType(
            parallelInsertSliceOp.getSourceType().getShape(), destBufferType,
            parallelInsertSliceOp.getMixedOffsets(),
            parallelInsertSliceOp.getMixedSizes(),
            parallelInsertSliceOp.getMixedStrides());
    Value subview = memref::SubViewOp::create(
        rewriter, parallelInsertSliceOp.getLoc(), subviewMemRefType,
        *destBuffer, parallelInsertSliceOp.getMixedOffsets(),
        parallelInsertSliceOp.getMixedSizes(),
        parallelInsertSliceOp.getMixedStrides());

    // This memcpy will fold away if everything bufferizes in-place.
    if (failed(options.createMemCpy(rewriter, parallelInsertSliceOp.getLoc(),
                                    *srcBuffer, subview)))
      return failure();

    // In case the source was allocated in the same block, make sure that the
    // deallocation op (if any) appears after the memcpy. By default, deallocs
    // are placed before the terminator, but this does not work for ForallOp
    // because the terminator does more than just yielding a value.
    //
    // Note: This is not a problem for the destination buffer because these are
    // assumed to always bufferize in-place.
    for (Operation *user : srcBuffer->getUsers()) {
      if (hasEffect<MemoryEffects::Free>(user)) {
        if (user->getBlock() == parallelCombiningParent->getBlock())
          rewriter.moveOpBefore(user, user->getBlock()->getTerminator());
        break;
      }
    }

    // Delete the op.
    rewriter.eraseOp(op);
    return success();
  }

  /// tensor.parallel_insert_slice has implicit in-place behavior; do not
  /// create a copy to resolve conflicts.
  LogicalResult
  resolveConflicts(Operation *op, RewriterBase &rewriter,
                   const AnalysisState &analysisState,
                   const BufferizationState &bufferizationState) const {
    return success();
  }
};

/// Bufferization of tensor.splat. Bufferizes to a new allocation that is
/// filled with a linalg.map. Similar to tensor.generate.
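///
/// Illustrative sketch (assumed IR):
/// ```
/// %0 = tensor.splat %v : tensor<4xf32>
/// ```
/// bufferizes roughly to a new allocation filled by a linalg.map whose body
/// simply yields %v.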
struct SplatOpInterface
    : public BufferizableOpInterface::ExternalModel<SplatOpInterface,
                                                    tensor::SplatOp> {

  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    OpBuilder::InsertionGuard g(rewriter);
    auto splatOp = cast<tensor::SplatOp>(op);

    // Allocate memory.
    Location loc = op->getLoc();
    FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
        rewriter, loc, splatOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(tensorAlloc))
      return failure();

    // Create linalg::MapOp.
    auto tensorType = cast<RankedTensorType>(tensorAlloc->getType());

    // TODO: Implement memory space for this op.
    if (options.defaultMemorySpaceFn(tensorType) != Attribute())
      return op->emitError("memory space not implemented yet");

    auto linalgOp = linalg::MapOp::create(rewriter, loc, tensorType,
                                          /*inputs=*/ValueRange(),
                                          /*init=*/*tensorAlloc);
    Block &linalgBody = linalgOp.getMapper().emplaceBlock();
    linalgBody.addArgument(tensorType.getElementType(), loc);

    // Yield the splat value from the map body.
    rewriter.setInsertionPointToStart(&linalgBody);
    linalg::YieldOp::create(rewriter, loc, splatOp.getInput());
    rewriter.replaceOp(splatOp, linalgOp.getResult()[0]);

    return success();
  }
};

/// Bufferization of tensor.concat. Bufferizes to a new allocation that is
/// filled with copy ops. Similar to tensor.from_elements, but using
/// memref.copy on subviews instead of memref.store.
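///
/// Illustrative sketch (assumed IR):
/// ```
/// %0 = tensor.concat dim(0) %a, %b
///     : (tensor<2xf32>, tensor<3xf32>) -> tensor<5xf32>
/// ```
/// bufferizes roughly to a 5-element allocation with one memref.subview +
/// memref.copy per input, at offsets 0 and 2 along dimension 0.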
struct ConcatOpInterface
    : public BufferizableOpInterface::ExternalModel<ConcatOpInterface,
                                                    tensor::ConcatOp> {

  bool bufferizesToAllocation(Operation *op, Value value) const { return true; }

  bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
                               const AnalysisState &state) const {
    return false;
  }

  bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
                              const AnalysisState &state) const {
    return true;
  }

  AliasingValueList getAliasingValues(Operation *op, OpOperand &opOperand,
                                      const AnalysisState &state) const {
    return {};
  }

  LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
                          const BufferizationOptions &options,
                          BufferizationState &state) const {
    OpBuilder::InsertionGuard g(rewriter);
    auto concatOp = cast<tensor::ConcatOp>(op);

    // Allocate memory.
    Location loc = op->getLoc();
    FailureOr<Value> tensorAlloc = allocateTensorForShapedValue(
        rewriter, loc, concatOp.getResult(), options, state,
        /*copy=*/false);
    if (failed(tensorAlloc))
      return failure();
    auto tensorType = cast<RankedTensorType>(tensorAlloc->getType());

    // TODO: Implement memory space for this op.
    if (options.defaultMemorySpaceFn(tensorType) != Attribute())
      return op->emitError("memory space not implemented yet");

    MemRefLayoutAttrInterface layout;
    MemRefType memrefType =
        MemRefType::get(concatOp.getResultType().getShape(),
                        concatOp.getResultType().getElementType(), layout);
    Value dstBuffer = bufferization::ToBufferOp::create(
        rewriter, op->getLoc(), memrefType, *tensorAlloc);

    // Extract the dimension for the concat op.
    uint64_t concatDim = concatOp.getDim();
    bool dynamicConcatDim = false;

    SmallVector<OpFoldResult> offsets(tensorType.getRank(),
                                      rewriter.getIndexAttr(0));
    SmallVector<OpFoldResult> strides(tensorType.getRank(),
                                      rewriter.getIndexAttr(1));
    SmallVector<OpFoldResult> sizes;

    for (const auto &[dimIdx, dimSize] :
         llvm::enumerate(tensorType.getShape())) {
      if (dimSize == ShapedType::kDynamic) {
        auto dimOp = memref::DimOp::create(rewriter, loc, dstBuffer, dimIdx);
        sizes.push_back(dimOp.getResult());
        if (dimIdx == concatDim)
          dynamicConcatDim = true;
      } else {
        sizes.push_back(rewriter.getIndexAttr(dimSize));
      }
    }

    int64_t concatDimOffset = 0;
    std::optional<Value> dynamicOffset;
    std::optional<Value> dynamicSize;
    if (dynamicConcatDim) {
      // One or more operands have dynamic size, so we must accumulate the
      // offset with arith ops.
      dynamicOffset = arith::ConstantIndexOp::create(rewriter, loc, 0);
    }

    for (auto operand : concatOp.getInputs()) {
      // Get the buffer for the operand.
      FailureOr<Value> srcBuffer = getBuffer(rewriter, operand, options, state);
      if (failed(srcBuffer))
        return failure();

      // Each operand may have a different size along the concat dimension,
      // so the offset on that axis must accumulate through the loop, and the
      // size must change to the size of the current operand.
      auto operandTensorType = cast<RankedTensorType>(operand.getType());
      int64_t operandConcatDimSize = operandTensorType.getDimSize(concatDim);

      if (dynamicConcatDim) {
        offsets[concatDim] = dynamicOffset.value();
        dynamicSize =
            memref::DimOp::create(rewriter, loc, *srcBuffer, concatDim)
                .getResult();
        sizes[concatDim] = dynamicSize.value();
      } else {
        sizes[concatDim] = rewriter.getIndexAttr(operandConcatDimSize);
        offsets[concatDim] = rewriter.getIndexAttr(concatDimOffset);
      }

      // Create a subview of the destination buffer.
      auto dstMemrefType = cast<MemRefType>(memrefType);
      MemRefType subviewMemRefType =
          memref::SubViewOp::inferRankReducedResultType(
              operandTensorType.getShape(), dstMemrefType, offsets, sizes,
              strides);
      Value subview = memref::SubViewOp::create(
          rewriter, loc, subviewMemRefType, dstBuffer, offsets, sizes, strides);

      // Copy the source buffer into the destination subview.
      if (failed(options.createMemCpy(rewriter, loc, *srcBuffer, subview)))
        return failure();

      if (dynamicConcatDim) {
        dynamicOffset = arith::AddIOp::create(
            rewriter, loc, dynamicOffset.value(), dynamicSize.value());
      } else {
        concatDimOffset += operandConcatDimSize;
      }
    }

    replaceOpWithBufferizedValues(rewriter, op, dstBuffer);
    return success();
  }
};

} // namespace
} // namespace tensor
} // namespace mlir

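/// Registers the external bufferization models defined above with a dialect
/// registry. A minimal usage sketch (the surrounding pass/pipeline set-up is
/// hypothetical):
/// ```
/// DialectRegistry registry;
/// mlir::tensor::registerBufferizableOpInterfaceExternalModels(registry);
/// MLIRContext ctx(registry);
/// ```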
void mlir::tensor::registerBufferizableOpInterfaceExternalModels(
    DialectRegistry &registry) {
  registry.addExtension(+[](MLIRContext *ctx, tensor::TensorDialect *dialect) {
    CastOp::attachInterface<CastOpInterface>(*ctx);
    CollapseShapeOp::attachInterface<CollapseShapeOpInterface>(*ctx);
    ConcatOp::attachInterface<ConcatOpInterface>(*ctx);
    DimOp::attachInterface<DimOpInterface>(*ctx);
    EmptyOp::attachInterface<EmptyOpInterface>(*ctx);
    ExpandShapeOp::attachInterface<ExpandShapeOpInterface>(*ctx);
    ExtractSliceOp::attachInterface<ExtractSliceOpInterface>(*ctx);
    ExtractOp::attachInterface<ExtractOpInterface>(*ctx);
    FromElementsOp::attachInterface<FromElementsOpInterface>(*ctx);
    GenerateOp::attachInterface<GenerateOpInterface>(*ctx);
    InsertOp::attachInterface<InsertOpInterface>(*ctx);
    InsertSliceOp::attachInterface<InsertSliceOpInterface>(*ctx);
    PadOp::attachInterface<PadOpInterface>(*ctx);
    ParallelInsertSliceOp::attachInterface<ParallelInsertSliceOpInterface>(
        *ctx);
    RankOp::attachInterface<RankOpInterface>(*ctx);
    ReshapeOp::attachInterface<ReshapeOpInterface>(*ctx);
    SplatOp::attachInterface<SplatOpInterface>(*ctx);

    // Load additional dialects of which ops may get created.
    ctx->loadDialect<arith::ArithDialect, linalg::LinalgDialect>();
  });

  // Bufferization requires SubsetInsertionOpInterface models. Make sure that
  // they are registered.
  tensor::registerSubsetOpInterfaceExternalModels(registry);
}