doxygen/DropRedundantRankExpansionPatterns_8cpp_source.html

//===- DropRedundantRankExpansionPatterns.cpp -----------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#include "mlir/Dialect/Affine/ViewLikeInterfaceUtils.h"

#include "mlir/Dialect/Tensor/IR/Tensor.h"

#include "mlir/Dialect/Tensor/Transforms/Transforms.h"

#include "mlir/Dialect/Tensor/Utils/Utils.h"

#include "mlir/IR/BuiltinTypes.h"

#include "mlir/IR/OpDefinition.h"

#include "mlir/IR/PatternMatch.h"


using namespace mlir;

using namespace mlir::tensor;


namespace {

/// Drop redundant rank expansion of insert_slice that is directly followed

/// by extract_slice. E.g.:

/// %0 = tensor.insert_slice %in... : tensor<5x10xf32> into tensor<1x1x5x10xf32>

/// %1 = tensor.extract_slice %0[0, 0, 2, 3] [1, 1, 2, 2] [1, 1, 1, 1]

///     : tensor<1x1x5x10xf32> to tensor<2x2xf32>

///

/// can be folded into:

///

/// %1 = tensor.extract_slice %in[2, 3] [2, 2] [1, 1]

///     : tensor<5x10xf32> to tensor<2x2xf32>

struct DropRedundantRankExpansionOnExtractSliceOfInsertSlice
    : public OpRewritePattern<ExtractSliceOp> {
  using OpRewritePattern::OpRewritePattern;

  /// Rewrites a rank-reducing `extractSliceOp` whose source is a single-use,
  /// cast-like tensor.insert_slice so that it reads directly from the
  /// insert_slice's source. Returns failure() whenever one of the
  /// preconditions below does not hold; on success both the original
  /// extract_slice and the insert_slice are removed.
  LogicalResult matchAndRewrite(ExtractSliceOp extractSliceOp,
                                PatternRewriter &rewriter) const override {
    // A slice that keeps every dim is not rank-reducing: nothing to fold.
    llvm::SmallBitVector reducedDims = extractSliceOp.getDroppedDims();
    if (reducedDims.none())
      return failure();

    // The slice must read from the result of a tensor.insert_slice.
    auto producer = extractSliceOp.getSource().getDefiningOp<InsertSliceOp>();
    if (!producer)
      return failure();
    llvm::SmallBitVector expandedDims = producer.getDroppedDims();

    // Preconditions, checked in this order:
    //  1. the dims expanded by the insert_slice are a subset of the dims
    //     dropped by the extract_slice;
    //  2. the insert_slice has no other user (otherwise it may not be
    //     redundant);
    //  3. the insert_slice is cast-like, i.e. a pure rank expansion that takes
    //     no elements from its destination.
    if (!expandedDims.subsetOf(reducedDims) || !producer->hasOneUse() ||
        !isCastLikeInsertSliceOp(producer))
      return failure();

    // Build the replacement right where the original extract_slice lives.
    OpBuilder::InsertionGuard guard(rewriter);
    rewriter.setInsertionPoint(extractSliceOp);

    SmallVector<OpFoldResult> allOffsets = extractSliceOp.getMixedOffsets();
    SmallVector<OpFoldResult> allSizes = extractSliceOp.getMixedSizes();
    SmallVector<OpFoldResult> allStrides = extractSliceOp.getMixedStrides();

    // Keep the offset/size/stride triple of every dim that the insert_slice did
    // not add; those are the dims addressed when slicing its source directly.
    SmallVector<OpFoldResult> newOffsets, newSizes, newStrides;
    const int64_t sourceRank = extractSliceOp.getSourceType().getRank();
    for (int64_t dim = 0; dim < sourceRank; ++dim) {
      if (!expandedDims.test(dim)) {
        newOffsets.push_back(allOffsets[dim]);
        newSizes.push_back(allSizes[dim]);
        newStrides.push_back(allStrides[dim]);
      }
    }

    // The result type is passed explicitly so the new op yields exactly the
    // type of the op it replaces.
    rewriter.replaceOpWithNewOp<ExtractSliceOp>(
        extractSliceOp, extractSliceOp.getResultType(),
        /*source=*/producer.getSource(), newOffsets, newSizes, newStrides);
    // Its only user was just replaced, so the insert_slice is now dead.
    rewriter.eraseOp(producer);
    return success();
  }
};


/// Drop redundant rank expansion of insert_slice that directly follows

/// extract_slice.

///

/// This can be done when the insert_slice op purely expands ranks (adds unit

/// dims) and the extract_slice drops corresponding unit dims. For example:

///

/// %extracted_slice = tensor.extract_slice %in[0, 0] [1, 8] [1, 1]

///     : tensor<2x8xf32> to tensor<8xf32>

/// %inserted_slice = tensor.insert_slice %extracted_slice

///     into %dest[0, 0] [1, 8] [1, 1]

///     : tensor<8xf32> into tensor<1x8xf32>

///

/// can be folded into:

///

/// %extracted_slice = tensor.extract_slice %in[0, 0] [1, 8] [1, 1]

///     : tensor<2x8xf32> to tensor<1x8xf32>

struct DropRedundantRankExpansionOnInsertSliceOfExtractSlice final
    : public OpRewritePattern<tensor::InsertSliceOp> {
  using OpRewritePattern<tensor::InsertSliceOp>::OpRewritePattern;

  /// Replaces a cast-like `insertSliceOp` whose source is a single-use
  /// tensor.extract_slice by one extract_slice that directly produces the
  /// insert_slice's result type. Reports a match failure (with a reason) when
  /// the ops do not line up; on success both original ops are removed.
  LogicalResult matchAndRewrite(tensor::InsertSliceOp insertSliceOp,
                                PatternRewriter &rewriter) const override {
    auto producer =
        insertSliceOp.getSource().getDefiningOp<tensor::ExtractSliceOp>();
    if (!producer)
      return rewriter.notifyMatchFailure(insertSliceOp,
                                         "source is not extract_slice");

    // The extract_slice is erased below, so it must not feed anything else.
    if (!producer->hasOneUse())
      return rewriter.notifyMatchFailure(insertSliceOp,
                                         "source has multi-uses");

    // The insert_slice must purely expand ranks (add unit dims).
    if (!isCastLikeInsertSliceOp(insertSliceOp))
      return rewriter.notifyMatchFailure(insertSliceOp,
                                         "insert_slice is not cast-like");

    llvm::SmallBitVector extractDropped = producer.getDroppedDims();
    llvm::SmallBitVector insertDropped = insertSliceOp.getDroppedDims();
    const auto numExtractDims = extractDropped.size();
    const auto numInsertDims = insertDropped.size();

    // The insert_slice must not expand to more dims than the extract_slice
    // started from.
    if (numExtractDims < numInsertDims)
      return rewriter.notifyMatchFailure(insertSliceOp,
                                         "insert_slice expands more dims");

    // Greedy left-to-right matching: walk the extract_slice dims and pair each
    // insert_slice dim with the left-most extract_slice dim that agrees with it
    // on being dropped/kept. The walk ends early once every insert_slice dim
    // has found a partner.
    unsigned insertPos = 0;
    for (unsigned extractPos = 0;
         extractPos < numExtractDims && insertPos != numInsertDims;
         ++extractPos) {
      const bool extractDrops = extractDropped[extractPos];
      const bool insertDrops = insertDropped[insertPos];

      // Both sides agree: this insert_slice dim is matched, move to the next.
      if (extractDrops == insertDrops) {
        ++insertPos;
        continue;
      }

      // The flags differ here. If the insert_slice side is the dropped one, the
      // extract_slice kept this dim, and there are not enough extract dropped
      // dims to match the insert dropped dims.
      if (insertDrops)
        return rewriter.notifyMatchFailure(insertSliceOp,
                                           "insert_slice drops more unit dims");

      // Otherwise the extract_slice dropped a dim that the insert_slice keeps:
      // retry the same insert_slice dim against the next extract_slice dim.
    }

    // Some insert_slice dims were left without a partner.
    if (insertPos != numInsertDims)
      return rewriter.notifyMatchFailure(insertSliceOp,
                                         "insert_slice has unmatched dims");

    // Reuse the extract_slice's offsets/sizes/strides, but produce the
    // insert_slice's result type directly.
    rewriter.replaceOpWithNewOp<tensor::ExtractSliceOp>(
        insertSliceOp, insertSliceOp.getType(), producer.getSource(),
        producer.getMixedOffsets(), producer.getMixedSizes(),
        producer.getMixedStrides());
    // Its only user was just replaced, so the old extract_slice is now dead.
    rewriter.eraseOp(producer);

    return success();
  }
};

} // namespace


/// Adds both redundant-rank-expansion folding patterns defined in this file to
/// `patterns`, constructing them with the context owned by `patterns`.
void mlir::tensor::populateDropRedundantInsertSliceRankExpansionPatterns(
    RewritePatternSet &patterns) {
  auto *context = patterns.getContext();
  patterns.add<DropRedundantRankExpansionOnExtractSliceOfInsertSlice,
               DropRedundantRankExpansionOnInsertSliceOfExtractSlice>(context);
}


success
return success()

OpDefinition.h

PatternMatch.h

ViewLikeInterfaceUtils.h

mlir::OpBuilder::setInsertionPoint
void setInsertionPoint(Block *block, Block::iterator insertPoint)
Set the insertion point to the specified location.
Definition Builders.h:400

mlir::RewritePatternSet
Definition PatternMatch.h:822

mlir::RewritePatternSet::getContext
MLIRContext * getContext() const
Definition PatternMatch.h:837

mlir::RewritePatternSet::add
RewritePatternSet & add(ConstructorArg &&arg, ConstructorArgs &&...args)
Add an instance of each of the pattern types 'Ts' to the pattern list with the given arguments.
Definition PatternMatch.h:861

mlir::RewriterBase::eraseOp
virtual void eraseOp(Operation *op)
This method erases an operation that is known to have no uses.
Definition PatternMatch.cpp:155

mlir::RewriterBase::notifyMatchFailure
std::enable_if_t<!std::is_convertible< CallbackT, Twine >::value, LogicalResult > notifyMatchFailure(Location loc, CallbackT &&reasonCallback)
Used to notify the listener that the IR failed to be rewritten because of a match failure,...
Definition PatternMatch.h:732

mlir::RewriterBase::replaceOpWithNewOp
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Definition PatternMatch.h:529

Utils.h

Tensor.h

Transforms.h

BuiltinTypes.h

mlir::tensor
Definition BufferizationTransformOps.h:19

mlir::tensor::isCastLikeInsertSliceOp
bool isCastLikeInsertSliceOp(InsertSliceOp op)
A tensor.insert_slice is a cast-like operation if it merely rank-extends the source tensor or inserts...
Definition Utils.cpp:125

mlir::tensor::populateDropRedundantInsertSliceRankExpansionPatterns
void populateDropRedundantInsertSliceRankExpansionPatterns(RewritePatternSet &patterns)
Populates patterns with patterns that drop redundant tensor.insert_slice rank expansions.
Definition DropRedundantRankExpansionPatterns.cpp:177

mlir
Include the generated interface declarations.
Definition ABIRewriteContext.h:29

mlir::OpRewritePattern
OpRewritePattern is a wrapper around RewritePattern that allows for matching and rewriting against an...
Definition PatternMatch.h:314

mlir::OpRewritePattern::OpRewritePattern
OpRewritePattern(MLIRContext *context, PatternBenefit benefit=1, ArrayRef< StringRef > generatedNames={})
Patterns must specify the root operation name they match against, and can also specify the benefit of...
Definition PatternMatch.h:322