MLIR  20.0.0git
FusePadOpWithLinalgProducer.cpp
Go to the documentation of this file.
1 //===- FusePadOpWithLinalgProducer.cpp ---- Fuse pad with linalg producer -===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements a pattern that fuses a linalg.generic -> tensor.pad op
10 // chain into a tensor.extract_slice -> linalg.generic -> tensor.insert_slice
11 // op chain.
12 //
13 //===----------------------------------------------------------------------===//
14 
16 
19 
20 using namespace mlir;
21 
22 namespace {
23 
24 /// A sequence of operations
25 ///
26 /// ```mlir
27 /// %0 = linalg. ...
28 /// %1 = tensor.pad %0 ...
29 /// ```
30 ///
31 /// can be replaced with
32 ///
33 /// ```mlir
34 /// %0 = linalg.fill
35 /// %1 = tensor.extract_slice %0 ...
36 /// %2 = linalg. .... outs(..., %1, ....) ....
37 /// %3 = tensor.insert_slice %2 into %1 ...
38 /// ```
39 ///
40 /// if the `linalg.generic` has all parallel iterator types.
41 struct FusePadOp : OpRewritePattern<tensor::PadOp> {
43 
44  LogicalResult matchAndRewrite(tensor::PadOp padOp,
45  PatternRewriter &rewriter) const override {
46  // Only works on padding op that sets the padded value to a constant.
47  Value padValue = padOp.getConstantPaddingValue();
48  if (!padValue)
49  return rewriter.notifyMatchFailure(padOp, "non constant padding");
50 
51  // This pattern could work for any Linalg op. For now restrict it to generic
52  // ops.
53  Value source = padOp.getSource();
54  auto linalgOp = source.getDefiningOp<linalg::GenericOp>();
55  if (!linalgOp) {
56  return rewriter.notifyMatchFailure(
57  padOp, "expected source to be linalg.generic op");
58  }
59  // All iterator types need to be parallel.
60  if (linalgOp.getNumLoops() != linalgOp.getNumParallelLoops()) {
61  return rewriter.notifyMatchFailure(
62  padOp, "only supported for ops with all parallel iterator types");
63  }
64  ReifiedRankedShapedTypeDims resultShape;
65  if (failed(reifyResultShapes(rewriter, padOp, resultShape)) ||
66  resultShape.size() != 1) {
67  return rewriter.notifyMatchFailure(
68  padOp, "failed to get shape of pad op result");
69  }
70 
71  Location loc = padOp.getLoc();
72 
73  // Create the tensor of same size as output of the pad op.
74  RankedTensorType padResultType = padOp.getResultType();
75  auto resultSizes = resultShape[0];
76  auto emptyTensor = rewriter.create<tensor::EmptyOp>(
77  loc, resultSizes, padResultType.getElementType());
78 
79  // Fill the tensor with the pad value.
80  // TODO: There is an option to fill only the boundaries. For now just
81  // filling the whole tensor.
82  auto fillTensor =
83  rewriter.create<linalg::FillOp>(loc, padValue, emptyTensor.getResult());
84 
85  // Construct a slice of the fill result that is to be replaced with the
86  // result of the generic op. The low pad values are the offsets, the size of
87  // the source is the size of the slice.
88  // TODO: This insert/extract could be potentially made a utility method.
89  unsigned resultNumber = cast<OpResult>(source).getResultNumber();
90  SmallVector<OpFoldResult> offsets = padOp.getMixedLowPad();
92  sizes.reserve(offsets.size());
93  for (const auto &shape :
94  llvm::enumerate(cast<RankedTensorType>(source.getType()).getShape())) {
95  if (ShapedType::isDynamic(shape.value())) {
96  sizes.push_back(
97  rewriter.create<tensor::DimOp>(loc, source, shape.index())
98  .getResult());
99  } else {
100  sizes.push_back(rewriter.getIndexAttr(shape.value()));
101  }
102  }
103  SmallVector<OpFoldResult> strides(offsets.size(), rewriter.getIndexAttr(1));
104  auto slice = rewriter.create<tensor::ExtractSliceOp>(
105  loc, fillTensor.getResult(0), offsets, sizes, strides);
106 
107  // Clone the generic op.
108  auto clonedOp =
109  cast<linalg::GenericOp>(rewriter.clone(*linalgOp.getOperation()));
110  clonedOp.setDpsInitOperand(resultNumber, slice.getResult());
111 
112  // Insert it back into the result of the fill.
113  rewriter.replaceOpWithNewOp<tensor::InsertSliceOp>(
114  padOp, clonedOp.getResult(resultNumber), fillTensor.getResult(0),
115  offsets, sizes, strides);
116  return success();
117  }
118 };
119 } // namespace
120 
123  patterns.add<FusePadOp>(patterns.getContext());
124 }
IntegerAttr getIndexAttr(int64_t value)
Definition: Builders.cpp:148
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:66
Operation * clone(Operation &op, IRMapping &mapper)
Creates a deep copy of the specified operation, remapping any operands that use values outside of the...
Definition: Builders.cpp:588
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
Definition: Builders.cpp:497
OpResult getResult(unsigned idx)
Get the 'idx'th result of this operation.
Definition: Operation.h:407
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
Definition: PatternMatch.h:791
std::enable_if_t<!std::is_convertible< CallbackT, Twine >::value, LogicalResult > notifyMatchFailure(Location loc, CallbackT &&reasonCallback)
Used to notify the listener that the IR failed to be rewritten because of a match failure,...
Definition: PatternMatch.h:724
OpTy replaceOpWithNewOp(Operation *op, Args &&...args)
Replace the results of the given (original) op with a new op that is created without verification (re...
Definition: PatternMatch.h:542
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96
Type getType() const
Return the type of this value.
Definition: Value.h:129
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition: Value.cpp:20
constexpr void enumerate(std::tuple< Tys... > &tuple, CallbackT &&callback)
Definition: Matchers.h:344
void populateFuseTensorPadWithProducerLinalgOpPatterns(RewritePatternSet &patterns)
Pattern to fuse a tensor.pad operation with the producer of its source, if the producer is a linalg o...
Include the generated interface declarations.
LogicalResult reifyResultShapes(OpBuilder &b, Operation *op, ReifiedRankedShapedTypeDims &reifiedReturnShapes)
Reify the shape of the result of an operation (typically in terms of the shape of its operands).
const FrozenRewritePatternSet & patterns
OpRewritePattern is a wrapper around RewritePattern that allows for matching and rewriting against an...
Definition: PatternMatch.h:358