//===- Padding.cpp - Padding of Linalg ops --------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "mlir/Dialect/Linalg/Transforms/Transforms.h"

#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Bufferization/IR/Bufferization.h"
#include "mlir/Dialect/Complex/IR/Complex.h"
#include "mlir/Dialect/Linalg/IR/Linalg.h"
#include "mlir/Dialect/Linalg/Transforms/Hoisting.h"
#include "mlir/Dialect/Tensor/IR/Tensor.h"
#include "mlir/Interfaces/ValueBoundsOpInterface.h"
#include "llvm/Support/Debug.h"

#define DEBUG_TYPE "linalg-padding"

using namespace mlir;
using namespace mlir::linalg;

#define DBGS() (llvm::dbgs() << "[" DEBUG_TYPE << "]: ")
#define DBGSNL() (llvm::dbgs() << "\n")

namespace {
/// Helper class for storing padding information.
struct PaddingInfo {
  PaddingInfo(int64_t padToMultipleOf = 1, OpFoldResult size = {})
      : padToMultipleOf(padToMultipleOf), size(size) {}
  /// The multiple to which the tensor dimension is padded.
  int64_t padToMultipleOf = 1;
  /// The size used for padding.
  OpFoldResult size = {};
};
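// For example, a dimension of un-padded size 10 with `padToMultipleOf` 8 is
// padded to ceil(10 / 8) * 8 = 16.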

/// Helper class for storing and computing the padded shape.
struct PaddedShape {
  /// Initializes the shape information and, on success, returns whether the
  /// shape of the operand will change. Returns failure if the operand cannot
  /// be padded.
  FailureOr<bool> initialize(linalg::LinalgOp opToPad, OpOperand *opOperand,
                             const LinalgPaddingOptions &options);

  /// Computes the padded shape.
  void computePadding(OpBuilder &builder, Value operand);

  /// Returns the new tensor type.
  RankedTensorType getType(Type elemTy) {
    return RankedTensorType::get(shape, elemTy);
  }

  SmallVector<Value> dynDims;

private:
  /// Padding information for each shape dimension, keyed by dimension index.
  llvm::DenseMap<int64_t, PaddingInfo> dimToInfo;
  /// The padded shape; `ShapedType::kDynamic` marks dynamic dimensions.
  SmallVector<int64_t> shape;
};
} // namespace

FailureOr<bool> PaddedShape::initialize(linalg::LinalgOp opToPad,
                                        OpOperand *opOperand,
                                        const LinalgPaddingOptions &options) {
  AffineMap indexingMap = opToPad.getMatchingIndexingMap(opOperand);

  // Initialize the padded shape.
  llvm::append_range(shape, opToPad.getShape(opOperand));

  // Collect the shape dimensions that are a function of "paddingDimensions",
  // along with the multiple that they should be padded to ("1" if none).
  bool alreadyHasRequestedShape = true;
  for (const auto &dimEn : enumerate(options.paddingDimensions)) {
    for (const auto &en : enumerate(indexingMap.getResults())) {
      if (en.value().isFunctionOfDim(dimEn.value())) {
        PaddingInfo paddingInfo;
        int64_t dimSize = shape[en.index()];
        if (options.padToMultipleOf.has_value()) {
          paddingInfo.padToMultipleOf =
              (*options.padToMultipleOf)[dimEn.index()];
        } else {
          paddingInfo.padToMultipleOf = 1;
        }

        // Check if the user provided a size in the options.
        paddingInfo.size =
            options.getSizeToPadTo(opOperand->getOperandNumber(), en.index());

        // Set the padding info.
        dimToInfo[en.index()] = paddingInfo;
        if (ShapedType::isDynamic(dimSize) ||
            dimSize % paddingInfo.padToMultipleOf != 0 ||
            !paddingInfo.size.isNull()) {
          alreadyHasRequestedShape = false;
        }
      }
    }
  }

  // Upper bound the sizes to obtain a static bounding box.
  for (int64_t i = 0, e = shape.size(); i < e; ++i) {
    LLVM_DEBUG(DBGS() << "--computing un-padded size for dim " << i << "\n");
    // Skip dimensions that do not require padding.
    if (!dimToInfo.contains(i)) {
      LLVM_DEBUG(DBGS() << "----dim does not require padding, SKIP\n");
      continue;
    }
    PaddingInfo &info = dimToInfo[i];
    if (info.size) {
      LLVM_DEBUG(DBGS() << "----the user provided the size: " << info.size
                        << "\n");
      continue;
    }
    // Otherwise, try to compute a constant upper bound for the size value.
    FailureOr<int64_t> upperBound =
        ValueBoundsConstraintSet::computeConstantBound(
            presburger::BoundType::UB,
            {opOperand->get(),
             /*dim=*/i},
            /*stopCondition=*/nullptr, /*closedUB=*/true);
    if (failed(upperBound)) {
      LLVM_DEBUG(
          DBGS() << "----could not compute a bounding box for padding\n");
      return failure();
    }
    info.size =
        IntegerAttr::get(IndexType::get(opToPad.getContext()), *upperBound);
    LLVM_DEBUG(DBGS() << "----new un-padded size: " << info.size << "\n");
  }
  return alreadyHasRequestedShape;
}
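// Hypothetical example of the bound computation above: after tiling, a
// dynamic size is often produced by an op such as
//   %sz = affine.min affine_map<(d0) -> (32, -d0 + 128)>(%iv)
// for which computeConstantBound can derive the closed upper bound 32, so the
// un-padded size of the corresponding dimension becomes the static value 32.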

void PaddedShape::computePadding(OpBuilder &builder, Value operand) {
  Location loc = operand.getLoc();
  AffineExpr sizeSym = builder.getAffineSymbolExpr(0);

  // Compute the padding for each dimension.
  for (auto &&[i, dim] : llvm::enumerate(shape)) {
    LLVM_DEBUG(DBGS() << "--computing padded size for dim " << i << "\n");

    // Get the padding info or default info for the shape dimension.
    PaddingInfo paddingInfo = dimToInfo.lookup(i);

    // Skip dimensions that do not require padding.
    if (paddingInfo.size.isNull()) {
      LLVM_DEBUG(DBGS() << "----dim does not require padding, SKIP\n");

      // We still need to push the size as `makeComposedPadHighOp` expects a
      // range with all the dynamic sizes, whether they're being padded or not.
      if (ShapedType::isDynamic(dim)) {
        dynDims.push_back(
            cast<Value>(tensor::getMixedSize(builder, loc, operand, i)));
      }
      continue;
    }

    // Compute the padded size to be a multiple of `padToMultipleOf`.
    AffineExpr szExpr = (sizeSym).ceilDiv(paddingInfo.padToMultipleOf) *
                        paddingInfo.padToMultipleOf;
    OpFoldResult paddedSize = affine::makeComposedFoldedAffineApply(
        builder, loc, szExpr, paddingInfo.size);
    assert(paddedSize && "invalid arguments to affine apply");

    if (auto cstSzAttr = dyn_cast<Attribute>(paddedSize)) {
      // Update the shape as the size is static.
      dim = cast<IntegerAttr>(cstSzAttr).getValue().getZExtValue();
    } else {
      // Add a dynamic dimension.
      dim = ShapedType::kDynamic;
      dynDims.push_back(cast<Value>(paddedSize));
    }
    LLVM_DEBUG(DBGS() << "----new dim size: " << paddedSize << "\n");
  }
}
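// When `paddingInfo.size` is a dynamic Value, the folded affine apply above
// materializes IR instead of a constant. A sketch with padToMultipleOf = 8
// and a hypothetical dynamic size %sz:
//   %padded_sz = affine.apply affine_map<()[s0] -> ((s0 ceildiv 8) * 8)>()[%sz]
// %padded_sz is then recorded in `dynDims` and the static size becomes
// ShapedType::kDynamic.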

/// Pad the `opOperand` in the "paddingDimensions" using the padding value and
/// the nofold flag found in "paddingValues" and "nofoldFlags", respectively.
///
/// Exit early and return the `opOperand` value if it already has the requested
/// shape, i.e.:
/// - static shape
/// - nofold is not set
/// - dim sizes are multiples of "padToMultipleOf"
///
/// Otherwise, try to pad the shape dimensions that match the iterator
/// dimensions "paddingDimensions" and return the tensor::PadOp result if
/// padding succeeds or failure otherwise.
static FailureOr<Value> padOperandToSmallestStaticBoundingBox(
    RewriterBase &rewriter, linalg::LinalgOp opToPad, OpOperand *opOperand,
    const LinalgPaddingOptions &options) {
  assert(
      (!options.padToMultipleOf.has_value() ||
       options.padToMultipleOf->size() == options.paddingDimensions.size()) &&
      "invalid number of elements in padToMultipleOf");

  // Initialize the padded shape and get whether it requires padding.
  PaddedShape shape;
  FailureOr<bool> alreadyHasRequestedShape =
      shape.initialize(opToPad, opOperand, options);
  if (failed(alreadyHasRequestedShape)) {
    return rewriter.notifyMatchFailure(opToPad,
                                       "--failed to compute padded shape");
  }

  // Return the un-padded operand if padding to a static shape is not needed
  // and the nofold flag is not set.
  bool nofold = opOperand->getOperandNumber() < options.nofoldFlags.size()
                    ? bool(options.nofoldFlags[opOperand->getOperandNumber()])
                    : false;
  if (!nofold && *alreadyHasRequestedShape)
    return opOperand->get();

  // Fail if `paddingValues` specifies no padding value.
  if (opOperand->getOperandNumber() >= options.paddingValues.size()) {
    return rewriter.notifyMatchFailure(opToPad, "--no padding value specified");
  }
  Attribute paddingAttr = options.paddingValues[opOperand->getOperandNumber()];

  Value paddingValue;
  if (auto complexTy = dyn_cast<ComplexType>(
          getElementTypeOrSelf(opOperand->get().getType()))) {
    auto complexAttr = cast<ArrayAttr>(paddingAttr);
    paddingValue = complex::ConstantOp::create(rewriter, opToPad.getLoc(),
                                               complexTy, complexAttr);
  } else {
    paddingValue = arith::ConstantOp::create(rewriter, opToPad.getLoc(),
                                             cast<TypedAttr>(paddingAttr));
  }

  // Compute the padded shape.
  if (!*alreadyHasRequestedShape)
    shape.computePadding(rewriter, opOperand->get());

  // Pad the operand to the bounding box defined by `paddedShape`.
  RankedTensorType paddedTensorType =
      shape.getType(getElementTypeOrSelf(opOperand->get()));
  LLVM_DEBUG(DBGS() << "--SUCCESS, makeComposedPadHighOp with type: "
                    << paddedTensorType << "\n");
  return makeComposedPadHighOp(rewriter, opToPad->getLoc(), paddedTensorType,
                               opOperand->get(), paddingValue, nofold,
                               shape.dynDims);
}
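// Sketch of the IR produced for a single operand, assuming hypothetical
// shapes: padding a tensor<7x11xf32> operand to multiples of [8, 16] with a
// zero padding value yields
//   %cst = arith.constant 0.000000e+00 : f32
//   %padded = tensor.pad %operand low[0, 0] high[1, 5] {
//   ^bb0(%i: index, %j: index):
//     tensor.yield %cst : f32
//   } : tensor<7x11xf32> to tensor<8x16xf32>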

LogicalResult
linalg::rewriteAsPaddedOp(RewriterBase &rewriter, LinalgOp opToPad,
                          const LinalgPaddingOptions &constOptions,
                          LinalgOp &paddedOp, SmallVector<Value> &replacements,
                          SmallVector<tensor::PadOp> &padOps) {
  LLVM_DEBUG(DBGS() << "Start rewriteAsPaddedOp : " << opToPad << "\n");
  Location loc = opToPad->getLoc();

  LinalgPaddingOptions options(constOptions);
  // Allow inference of pad values if they are not explicitly specified.
  // TODO: be mindful about the value depending on the actual operation.
  if (options.paddingValues.empty()) {
    SmallVector<Type> types(opToPad->getOperandTypes());
    llvm::append_range(types, opToPad->getResultTypes());
    for (Type t : types) {
      options.paddingValues.push_back(
          rewriter.getZeroAttr(getElementTypeOrSelf(t)));
    }
  }

  // TODO: there are cases where we may still want to pad to larger sizes.
  if (!opToPad.hasPureTensorSemantics())
    return rewriter.notifyMatchFailure(opToPad,
                                       "expected operation on tensors");

  OpBuilder::InsertionGuard g(rewriter);
  // Set IP after op because we also take the dims of the original output.
  rewriter.setInsertionPointAfter(opToPad);

  // Make a copy of the shaped operands and update it.
  SmallVector<Value> newOperands;
  newOperands.reserve(opToPad->getNumOperands());
  for (OpOperand &opOperand : opToPad->getOpOperands()) {
    FailureOr<Value> paddedOperand = padOperandToSmallestStaticBoundingBox(
        rewriter, opToPad, &opOperand, options);
    // Exit if `paddingDimensions` cannot be bounded statically.
    if (failed(paddedOperand)) {
      LLVM_DEBUG(DBGS() << "--operand cannot be bound statically : "
                        << opOperand.get() << " -> FAIL\n");
      return rewriter.notifyMatchFailure(opToPad,
                                         "operand cannot be bound statically");
    }
    newOperands.push_back(*paddedOperand);
    if (auto padOp = paddedOperand->getDefiningOp<tensor::PadOp>())
      padOps.push_back(padOp);
  }

  ReifiedRankedShapedTypeDims reifiedResultShapes;
  if (failed(reifyResultShapes(rewriter, opToPad, reifiedResultShapes))) {
    LLVM_DEBUG(DBGS() << "--failed to reify result shapes -> FAIL\n");
    return rewriter.notifyMatchFailure(opToPad,
                                       "failed to reify result shapes");
  }
  assert(reifiedResultShapes.size() == opToPad->getNumResults() &&
         "expected same number of results");

  // Clone `opToPad` to operate on the statically padded shapes.
  auto resultTensorTypes =
      ValueRange(newOperands).take_back(opToPad.getNumDpsInits()).getTypes();
  // clone **should** properly notify the rewriter.
  paddedOp = clone(rewriter, opToPad, resultTensorTypes, newOperands);
  LLVM_DEBUG(DBGS() << "--cloned padded op: " << paddedOp << "\n");

  // Recover the slice out of the new static results. This keeps the original
  // linalg op around because it uses the dims of the original results.
  SmallVector<Value> paddedSubtensorResults;
  paddedSubtensorResults.reserve(opToPad->getNumResults());
  for (const auto &en : llvm::enumerate(paddedOp->getResults())) {
    Value paddedResult = en.value();
    int64_t resultNumber = en.index();
    int64_t rank = cast<RankedTensorType>(paddedResult.getType()).getRank();
    SmallVector<OpFoldResult> offsets(rank, rewriter.getIndexAttr(0));
    SmallVector<OpFoldResult> strides(rank, rewriter.getIndexAttr(1));
    paddedSubtensorResults.push_back(tensor::ExtractSliceOp::create(
        rewriter, loc, paddedResult, offsets, reifiedResultShapes[resultNumber],
        strides));
  }

  if (options.copyBackOp == LinalgPaddingOptions::CopyBackOp::None) {
    replacements = std::move(paddedSubtensorResults);
    return success();
  }

  // Copy back unpadded results to the original destination (i.e., inits of the
  // linalg op), so that the destination buffer of the computation does not
  // change. If the padding folds away, this will materialize as a memcpy
  // between two identical buffers, which will then also fold away.
  assert(static_cast<int64_t>(paddedSubtensorResults.size()) ==
             opToPad.getNumDpsInits() &&
         "expected matching number of results");
  for (auto it :
       llvm::zip(paddedSubtensorResults, opToPad.getDpsInitsMutable())) {
    if (options.copyBackOp == LinalgPaddingOptions::CopyBackOp::LinalgCopy) {
      replacements.push_back(linalg::CopyOp::create(rewriter, loc,
                                                    std::get<0>(it),
                                                    std::get<1>(it).get())
                                 .getResult(0));
    } else if (options.copyBackOp == LinalgPaddingOptions::CopyBackOp::
                   BufferizationMaterializeInDestination) {
      replacements.push_back(
          bufferization::MaterializeInDestinationOp::create(
              rewriter, loc, std::get<0>(it), std::get<1>(it).get())
              ->getResult(0));
    } else {
      llvm_unreachable("unsupported copy back op");
    }
  }
  return success();
}
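// End-to-end sketch with hypothetical shapes: a linalg.matmul with operands
// tensor<7x12xf32> and tensor<12x13xf32> and init tensor<7x13xf32>, padded
// with paddingDimensions = [0, 1, 2] (m, n, k) and padToMultipleOf =
// [8, 16, 8], roughly becomes
//   %a_pad = tensor.pad %a ... : tensor<7x12xf32> to tensor<8x16xf32>
//   %b_pad = tensor.pad %b ... : tensor<12x13xf32> to tensor<16x16xf32>
//   %c_pad = tensor.pad %c ... : tensor<7x13xf32> to tensor<8x16xf32>
//   %mm = linalg.matmul ins(%a_pad, %b_pad : tensor<8x16xf32>,
//             tensor<16x16xf32>) outs(%c_pad : tensor<8x16xf32>)
//             -> tensor<8x16xf32>
//   %sl = tensor.extract_slice %mm[0, 0] [7, 13] [1, 1]
//       : tensor<8x16xf32> to tensor<7x13xf32>
// followed, for copyBackOp = LinalgCopy, by a linalg.copy of %sl back into
// the original init %c.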

FailureOr<LinalgOp>
linalg::padAndHoistLinalgOp(RewriterBase &rewriter, LinalgOp linalgOp,
                            const LinalgPaddingOptions &options) {
  assert(options.copyBackOp == LinalgPaddingOptions::CopyBackOp::None &&
         "invalid options");

  if (!linalgOp.hasPureTensorSemantics())
    return rewriter.notifyMatchFailure(
        linalgOp, "only applies to Linalg ops with tensor semantics");

  // Pad the operation.
  LinalgOp paddedOp;
  SmallVector<Value> newResults;
  SmallVector<tensor::PadOp> padOps;
  if (failed(rewriteAsPaddedOp(rewriter, linalgOp, options, paddedOp,
                               newResults, padOps)))
    return rewriter.notifyMatchFailure(linalgOp,
                                       "failed to rewrite as a padded op");

  // Hoist the padding.
  for (const auto &en : enumerate(options.hoistPaddings)) {
    if (static_cast<int64_t>(en.index()) >= paddedOp->getNumOperands())
      break;
    OpOperand &opOperand = paddedOp->getOpOperand(en.index());
    auto padOp = opOperand.get().getDefiningOp<tensor::PadOp>();
    if (!padOp || en.value() == 0) {
      (void)rewriter.notifyMatchFailure(linalgOp, "not a tensor.pad -- skip");
      continue;
    }

    // Fail hoisting if the operand shape is not fully static.
    if (llvm::any_of(paddedOp.getShape(&opOperand), ShapedType::isDynamic)) {
      (void)rewriter.notifyMatchFailure(linalgOp,
                                        "non static padding shape -- skip");
      continue;
    }

    tensor::PadOp hoistedOp;
    SmallVector<TransposeOp> transposeOps;
    SmallVector<int64_t> transposeVector =
        en.index() < options.transposePaddings.size()
            ? options.transposePaddings[en.index()]
            : SmallVector<int64_t>();

    FailureOr<Value> newResult = hoistPaddingOnTensors(
        padOp, en.value(), transposeVector, hoistedOp, transposeOps);
    if (failed(newResult)) {
      (void)rewriter.notifyMatchFailure(linalgOp,
                                        "failed to apply hoistPadding");
      continue;
    }
    rewriter.replaceOp(padOp, *newResult);
  }

  // Replace the original op with the padded results.
  rewriter.replaceOp(linalgOp, newResults);

  return paddedOp;
}
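// A hypothetical driver (not part of this file) could invoke the
// transformation as follows; all option values are illustrative:
//   LinalgPaddingOptions options;
//   options.paddingDimensions = {0, 1, 2};
//   options.padToMultipleOf = SmallVector<int64_t>{8, 16, 8};
//   options.hoistPaddings = {2, 2, 0};
//   options.copyBackOp = LinalgPaddingOptions::CopyBackOp::None;
//   FailureOr<LinalgOp> maybePadded =
//       linalg::padAndHoistLinalgOp(rewriter, linalgOp, options);
//   if (failed(maybePadded))
//     return failure();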