doxygen/TileUsingInterface_8h_source.html

 //===- TileUsingInterface.h - Tiling ops using TilingInterface --*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #ifndef MLIR_DIALECT_SCF_TRANSFORMS_TILEUSINGINTERFACE_H

 #define MLIR_DIALECT_SCF_TRANSFORMS_TILEUSINGINTERFACE_H


 #include "mlir/Dialect/SCF/IR/SCF.h"

 #include "mlir/Dialect/Tensor/Transforms/Transforms.h"

 #include "mlir/IR/PatternMatch.h"

 #include "mlir/Interfaces/LoopLikeInterface.h"

 #include "mlir/Interfaces/TilingInterface.h"

 #include "mlir/Interfaces/ViewLikeInterface.h"

 #include "mlir/Rewrite/FrozenRewritePatternSet.h"


 #include <deque>


 namespace mlir {

 class Operation;

 class RewriterBase;

 class TilingInterface;

 } // namespace mlir


 namespace mlir {

 namespace scf {


 using SCFTileSizeComputationFunction =

     std::function<SmallVector<OpFoldResult>(OpBuilder &, Operation *)>;


 /// Options to use to control tiling.

 struct SCFTilingOptions {

   /// Computation function that returns the tile sizes to use for each loop.

   /// Returning a tile size of zero implies no tiling for that loop. If the

   /// size of the returned vector is smaller than the number of loops, the inner

   /// loops are not tiled. If the size of the returned vector is larger, then

   /// the vector is truncated to number of loops.

   SCFTileSizeComputationFunction tileSizeComputationFunction = nullptr;


   SCFTilingOptions &

   setTileSizeComputationFunction(SCFTileSizeComputationFunction fun) {

     tileSizeComputationFunction = std::move(fun);

     return *this;

   }

   /// Convenience function to set the `tileSizeComputationFunction` to a

   /// function that computes tile sizes at the point they are needed. Allows

   /// proper interaction with folding.

   SCFTilingOptions &setTileSizes(ArrayRef<OpFoldResult> tileSizes);


   /// Computation function that returns the number of threads to use for

   /// each loop. Returning a num threads of zero implies no tiling for that

   /// loop. If the size of the returned vector is smaller than the number of

   /// loops, the inner loops are not tiled. If the size of the returned vector

   /// is larger, then the vector is truncated to number of loops. Note: This

   /// option is only supported with loopType set to `LoopType::ForallOp`. If the

   /// tile size function is not specified while the num threads computation is,

   /// then the tile size is determined automatically to map at most one tile per

   /// thread.

   SCFTileSizeComputationFunction numThreadsComputationFunction = nullptr;


   SCFTilingOptions &

   setNumThreadsComputationFunction(SCFTileSizeComputationFunction fun) {

     numThreadsComputationFunction = std::move(fun);

     return *this;

   }

   /// Convenience function to set the `numThreadsComputationFunction` to a

   /// function that computes num threads at the point they are needed.

   SCFTilingOptions &setNumThreads(ArrayRef<OpFoldResult> numThreads);


   /// The interchange vector to reorder the tiled loops.

   SmallVector<int64_t> interchangeVector = {};

   SCFTilingOptions &setInterchange(ArrayRef<int64_t> interchange) {

     interchangeVector = llvm::to_vector(interchange);

     return *this;

   }


   /// Specify which loop construct to use for tile and fuse.

   enum class LoopType { ForOp, ForallOp };

   LoopType loopType = LoopType::ForOp;

   SCFTilingOptions &setLoopType(LoopType type) {

     loopType = type;

     return *this;

   }


   /// Specify how reduction dimensions should be tiled.

   ///

   /// Tiling can be thought of as splitting a dimension into 2 and materializing

   /// the outer dimension as a loop:

   ///

   /// op[original] -> op[original / x, x] -> loop[original] { op[x] }

   ///

   /// For parallel dimensions, the split can only happen in one way, with both

   /// dimensions being parallel. For reduction dimensions however, there is a

   /// choice in how we split the reduction dimension. This enum exposes this

   /// choice.

   enum class ReductionTilingStrategy {

     // [reduction] -> [reduction1, reduction2]

     // -> loop[reduction1] { [reduction2] }

     FullReduction,

     // [reduction] -> [reduction1, parallel2]

     // -> loop[reduction1] { [parallel2] }; merge[reduction1]

     PartialReductionOuterReduction,

     // [reduction] -> [parallel1, reduction2]

     // -> loop[parallel1] { [reduction2] }; merge[parallel1]

     PartialReductionOuterParallel

   };

   ReductionTilingStrategy reductionStrategy =

       ReductionTilingStrategy::FullReduction;

   SCFTilingOptions &

   setReductionTilingStrategy(ReductionTilingStrategy strategy) {

     reductionStrategy = strategy;

     return *this;

   }


   /// Specify mapping of loops to devices. This is only respected when the loop

   /// constructs support such a mapping (like `scf.forall`). Will be ignored

   /// when using loop constructs that dont support such a mapping (like

   /// `scf.for`)

   SmallVector<Attribute> mappingVector = {};

   SCFTilingOptions &setMapping(ArrayRef<Attribute> mapping) {

     mappingVector = llvm::to_vector(mapping);

     return *this;

   }

 };


 /// Transformation information returned after tiling.

 struct SCFTilingResult {

   /// Tiled operations that are generated during tiling. The order does not

   /// matter except the last op. The replacements are expected to be the results

   /// of the last op.

   SmallVector<Operation *> tiledOps;

   /// The initial destination values passed to the tiled operations.

   SmallVector<Value> initialValues;

   /// The `scf.for` operations that iterate over the tiles.

   SmallVector<LoopLikeOpInterface> loops;

   /// The result generated by the loop nest in tiling, may hold partial results,

   /// which need to be merged to match the computation of the untiled operation.

   /// `mergeResult` contains the operations used to perform this merge from

   /// partial results and the values that can be used as replacements of

   /// the untiled operation.

   MergeResult mergeResult;

   /// Slices generated after tiling that can be used for fusing with the tiled

   /// producer.

   SmallVector<Operation *> generatedSlices;

 };


 /// Method to tile an op that implements the `TilingInterface` using

 /// `scf.for` for iterating over the tiles.

 FailureOr<SCFTilingResult> tileUsingSCF(RewriterBase &rewriter,

                                         TilingInterface op,

                                         const SCFTilingOptions &options);


 /// Options used to control tile + fuse.

 struct SCFTileAndFuseOptions {

   /// The tiling options used to control the tiling of the consumer.

   SCFTilingOptions tilingOptions;

   SCFTileAndFuseOptions &setTilingOptions(SCFTilingOptions options) {

     tilingOptions = options;

     return *this;

   }


   /// Control function to check if a slice needs to be fused or not,

   /// The control function receives

   /// 1) the slice along which fusion is to be done,

   /// 2) the producer value that is to be fused

   /// 3) a boolean value set to `true` if the fusion is from

   ///    a destination operand.

   /// The control function returns an `std::optiona<ControlFnResult>`.

   /// If the return value is `std::nullopt`, that implies no fusion

   /// is to be performed along that slice.

   struct ControlFnResult {

     /// Set to true if the loop nest has to return a replacement value

     /// for the fused producer.

     bool yieldProducerReplacement = false;

   };

   using ControlFnTy = std::function<std::optional<ControlFnResult>(

       tensor::ExtractSliceOp candidateSliceOp, OpResult originalProducer,

       bool isDestinationOperand)>;

   /// The default control function implements greedy fusion without yielding

   /// a replacement for any of the fused results.

   ControlFnTy fusionControlFn = [](tensor::ExtractSliceOp, OpResult,

                                    bool) -> std::optional<ControlFnResult> {

     return ControlFnResult{};

   };

   SCFTileAndFuseOptions &setFusionControlFn(ControlFnTy controlFn) {

     fusionControlFn = controlFn;

     return *this;

   }


   /// An optional set of rewrite patterns to apply to the results of tiling

   /// before fusion. This will track deleted and newly inserted

   /// `tensor.extract_slice` ops and update the worklist.

   std::optional<FrozenRewritePatternSet> cleanupPatterns = std::nullopt;

 };


 /// Fuse the producer of the source of `candidateSliceOp` by computing the

 /// required slice of the producer in-place.  Note that the method

 /// replaces the uses of `candidateSliceOp` with the tiled and fused producer

 /// value but does not delete the slice operation.

 struct SCFFuseProducerOfSliceResult {

   OpResult origProducer;       // Original untiled producer.

   Value tiledAndFusedProducer; // Tile and fused producer value.

   SmallVector<Operation *> tiledOps;

   SmallVector<Operation *> generatedSlices;

 };

 std::optional<SCFFuseProducerOfSliceResult>

 tileAndFuseProducerOfSlice(RewriterBase &rewriter,

                            tensor::ExtractSliceOp candidateSliceOp,

                            MutableArrayRef<LoopLikeOpInterface> loops);


 /// Reconstruct the fused producer from within the tiled-and-fused code. Based

 /// on the slice of the producer computed in place it is possible that within

 /// the loop nest same slice of the producer is computed multiple times. It is

 /// in general not possible to recompute the value of the fused producer from

 /// the tiled loop code in such cases. For the cases where no slice of the

 /// producer is computed in a redundant fashion it is possible to reconstruct

 /// the value of the original producer from within the tiled loop. It is upto

 /// the caller to ensure that the producer is not computed redundantly within

 /// the tiled loop nest. For example, consider

 ///

 /// ```mlir

 /// %0 = linalg.matmul ins(...) outs(...) -> tensor<?x?xf32>

 /// %1 = linalg.matmul ins(%0, ..) outs(...) -> tensor<?x?x?f32>

 /// ```

 ///

 /// If `%1` is tiled in a 2D fashion and `%0` is fused with it, the resulting IR

 /// is,

 ///

 /// ```mlir

 /// %t1_0 = scf.for .... iter_args(%arg0 = ...) {

 ///   %t1_1 = scf.for ... iter_args(%arg1 = %arg0) {

 ///     ...

 ///     %t1_2 = linalg.matmul ins(...) outs(...) -> tensor<?x?xf32>

 ///     %t1_3 = linalg.matmul ins(%t1_2, ...)

 ///     %t1_4 = tensor.insert_slice %t1_3 into %arg1 ...

 ///     scf.yield %t1_4

 ///   }

 ///   scf.yield %t1_1

 /// }

 /// ```

 ///

 /// Here `%t1_2` is the same for all iterations of the inner `scf.for`. Instead

 /// if `%1` were tiled only along the rows, the resultant code would be

 ///

 /// ```mlir

 /// %t2_0 = scf.for .... iter_args(%arg0 = ...) {

 ///   ...

 ///   %t2_1 = linalg.matmul ins(...) outs(...) -> tensor<?x?xf32>

 ///   %t2_2 = linalg.matmul ins(%t2_1, ...)

 ///   %t2_3 = tensor.insert_slice %t2_2 into %arg0 ...

 ///   scf.yield %t2_3

 /// }

 /// ```

 ///

 /// Here there is no intersection in the different slices of `%t2_1` computed

 /// across iterations of the `scf.for`. In such cases, the value of the original

 /// `%0` can be reconstructed from within the loop body. This is useful in cases

 /// where `%0` had other uses as well. If not reconstructed from within the loop

 /// body, uses of `%0` could not be replaced, making it still live and the

 /// fusion immaterial.

 ///

 /// The @param `yieldResultNumber` decides which result would be yield. If not

 /// given, yield all `opResult` of fused producer.

 ///

 /// The method returns the list of new slices added during the process (which

 /// can be used to fuse along).

 FailureOr<SmallVector<Operation *>> yieldReplacementForFusedProducer(

     RewriterBase &rewriter, tensor::ExtractSliceOp sliceOp,

     scf::SCFFuseProducerOfSliceResult fusedProducerInfo,

     MutableArrayRef<LoopLikeOpInterface> loops,

     ArrayRef<unsigned> yieldResultNumber = ArrayRef<unsigned>{});


 /// Transformation information returned after tile and fuse.

 struct SCFTileAndFuseResult {

   /// List of untiled operations that were fused with the tiled consumer.

   llvm::SetVector<Operation *> fusedProducers;

   /// List of tiled and fused operations generated. The first one in this list

   /// is guaranteed to be the tiled operations generated during tiling of the

   /// generated operation.

   llvm::SetVector<Operation *> tiledAndFusedOps;

   /// The `scf.for` operations that iterate over the tiles.

   SmallVector<LoopLikeOpInterface> loops;

   /// The replacement values to use for the tiled and fused operations.

   llvm::DenseMap<Value, Value> replacements;

 };


 /// Method to tile and fuse a sequence of operations, by tiling the consumer

 /// and fusing its producers. Note that this assumes that it is valid to

 /// tile+fuse the producer into the innermost tiled loop. Its up to the caller

 /// to ensure that the tile sizes provided make this fusion valid.

 ///

 /// For example, for the following sequence

 ///

 /// ```mlir

 /// %0 =

 /// %1 = linalg.fill ... outs(%0 : ... )

 /// %2 = linalg.matmul ... outs(%1 : ...) ...

 /// ```

 ///

 /// it is legal to fuse the fill with the matmul only if the matmul is tiled

 /// along the parallel dimensions and not the reduction dimension, i.e. the tile

 /// size for the reduction dimension should be 0. The resulting fused

 /// transformation is

 ///

 /// ```mlir

 /// %1 = scf.for ... iter_args(%arg0 = %0)

 ///   %2 = tensor.extract_slice %arg0

 ///   %3 = linalg.fill .. outs(%2 : ... )

 ///   %4 = linalg.matmul .. outs(%3 : ...)

 /// }

 /// ```

 FailureOr<SCFTileAndFuseResult>

 tileConsumerAndFuseProducersUsingSCF(RewriterBase &rewriter,

                                      TilingInterface consumer,

                                      const SCFTileAndFuseOptions &options);


 /// Fuse the consumer of the source of `candidateSliceOp` by computing the

 /// required slice of the consumer in-place.  Note that the method

 /// replaces the uses of `candidateSliceOp` with the tiled and fused consumer

 /// value but does not delete the slice operation.

 struct SCFFuseConsumerOfSliceResult {

   OpOperand *origConsumerOperand; // Original untiled consumer's operand.

   OpOperand

       *tiledAndFusedConsumerOperand; // Tiled and fused consumer's operand.

   SmallVector<Operation *> tiledOps;

 };

 FailureOr<scf::SCFFuseConsumerOfSliceResult>

 tileAndFuseConsumerOfSlice(RewriterBase &rewriter, Operation *candidateSliceOp,

                            MutableArrayRef<LoopLikeOpInterface> loops);


 /// Method to lower an `op` that implements the `TilingInterface` to

 /// loops/scalars.

 FailureOr<SmallVector<scf::ForOp>>

 lowerToLoopsUsingSCFForOp(RewriterBase &rewriter, TilingInterface op);


 /// Method to tile a reduction and generate a parallel op within a serial loop.

 /// Each of the partial reductions are calculated in parallel. Then after the

 /// loop all the partial reduction are merged into a final reduction.

 /// For example for the following sequence

 ///

 /// ```mlir

 /// %0 = linalg.generic %in ["parallel", "reduction"]

 ///   : tensor<7x9xf32> -> tensor<7xf32>

 /// ```

 ///

 /// into:

 ///

 /// ```mlir

 /// %0 = linalg.fill ... : tensor<7x4xf32>

 /// %1 = scf.for ... iter_args(%arg0 = %0)

 ///   %2 = tensor.extract_slice %arg0 : tensor<7x4xf32> -> tensor<7x?xf32>

 ///   %3 = tensor.extract_slice %in : tensor<7x9xf32> -> tensor<7x?xf32>

 ///   %4 = linalg.generic %2, %3 ["parallel", "parallel"]

 ///     : tensor<7x?xf32> -> tensor<7x?xf32>

 ///   %5 = tensor.insert_slice %3, %0[0, 0] : tensor<7x4xf32>

 /// }

 /// %6 = linalg.generic %1 ["parallel", "reduction"]

 ///   : tensor<7x4xf32> -> tensor<7xf32>

 /// ```

 FailureOr<scf::SCFTilingResult>

 tileReductionUsingScf(RewriterBase &b, PartialReductionOpInterface op,

                       ArrayRef<OpFoldResult> tileSize);


 } // namespace scf

 } // namespace mlir


 #endif // MLIR_DIALECT_SCF_TRANSFORMS_TILEUSINGINTERFACE_H

FrozenRewritePatternSet.h

LoopLikeInterface.h

options
static llvm::ManagedStatic< PassManagerOptions > options
Definition: PassManagerOptions.cpp:89

PatternMatch.h

TilingInterface.h

ViewLikeInterface.h

llvm::ArrayRef
Definition: LLVM.h:48

llvm::DenseMap< Value, Value >

llvm::MutableArrayRef
Definition: LLVM.h:62

llvm::SetVector
Definition: LLVM.h:66

llvm::SmallVector
Definition: LLVM.h:72

mlir::OpBuilder
This class helps build Operations.
Definition: Builders.h:204

mlir::OpOperand
This class represents an operand of an operation.
Definition: Value.h:243

mlir::OpResult
This is a value defined by a result of an operation.
Definition: Value.h:433

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::RewriterBase
This class coordinates the application of a rewrite on a set of IR, providing a way for clients to tr...
Definition: PatternMatch.h:358

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

SCF.h

Transforms.h

mlir::scf::tileAndFuseConsumerOfSlice
FailureOr< scf::SCFFuseConsumerOfSliceResult > tileAndFuseConsumerOfSlice(RewriterBase &rewriter, Operation *candidateSliceOp, MutableArrayRef< LoopLikeOpInterface > loops)
Implementation of fusing consumer of a single slice by computing the slice of the consumer in-place f...
Definition: TileUsingInterface.cpp:1991

mlir::scf::tileUsingSCF
FailureOr< SCFTilingResult > tileUsingSCF(RewriterBase &rewriter, TilingInterface op, const SCFTilingOptions &options)
Method to tile an op that implements the TilingInterface using scf.for for iterating over the tiles.
Definition: TileUsingInterface.cpp:933

mlir::scf::lowerToLoopsUsingSCFForOp
FailureOr< SmallVector< scf::ForOp > > lowerToLoopsUsingSCFForOp(RewriterBase &rewriter, TilingInterface op)
Method to lower an op that implements the TilingInterface to loops/scalars.
Definition: TileUsingInterface.cpp:2219

mlir::scf::yieldReplacementForFusedProducer
FailureOr< SmallVector< Operation * > > yieldReplacementForFusedProducer(RewriterBase &rewriter, tensor::ExtractSliceOp sliceOp, scf::SCFFuseProducerOfSliceResult fusedProducerInfo, MutableArrayRef< LoopLikeOpInterface > loops, ArrayRef< unsigned > yieldResultNumber=ArrayRef< unsigned >{})
Reconstruct the fused producer from within the tiled-and-fused code.
Definition: TileUsingInterface.cpp:1252

mlir::scf::tileConsumerAndFuseProducersUsingSCF
FailureOr< SCFTileAndFuseResult > tileConsumerAndFuseProducersUsingSCF(RewriterBase &rewriter, TilingInterface consumer, const SCFTileAndFuseOptions &options)
Method to tile and fuse a sequence of operations, by tiling the consumer and fusing its producers.
Definition: TileUsingInterface.cpp:1523

mlir::scf::tileReductionUsingScf
FailureOr< scf::SCFTilingResult > tileReductionUsingScf(RewriterBase &b, PartialReductionOpInterface op, ArrayRef< OpFoldResult > tileSize)
Method to tile a reduction and generate a parallel op within a serial loop.
Definition: TileUsingInterface.cpp:1084

mlir::scf::SCFTileSizeComputationFunction
std::function< SmallVector< OpFoldResult >(OpBuilder &, Operation *)> SCFTileSizeComputationFunction
Definition: TileUsingInterface.h:32

mlir::scf::tileAndFuseProducerOfSlice
std::optional< SCFFuseProducerOfSliceResult > tileAndFuseProducerOfSlice(RewriterBase &rewriter, tensor::ExtractSliceOp candidateSliceOp, MutableArrayRef< LoopLikeOpInterface > loops)
Implementation of fusing producer of a single slice by computing the slice of the producer in-place.
Definition: TileUsingInterface.cpp:1137

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::MergeResult
Container for the result of merge operation of tiling.
Definition: TilingInterface.h:43

mlir::scf::SCFFuseConsumerOfSliceResult
Fuse the consumer of the source of candidateSliceOp by computing the required slice of the consumer i...
Definition: TileUsingInterface.h:324

mlir::scf::SCFFuseConsumerOfSliceResult::origConsumerOperand
OpOperand * origConsumerOperand
Definition: TileUsingInterface.h:325

mlir::scf::SCFFuseConsumerOfSliceResult::tiledOps
SmallVector< Operation * > tiledOps
Definition: TileUsingInterface.h:328

mlir::scf::SCFFuseConsumerOfSliceResult::tiledAndFusedConsumerOperand
OpOperand * tiledAndFusedConsumerOperand
Definition: TileUsingInterface.h:327

mlir::scf::SCFFuseProducerOfSliceResult
Fuse the producer of the source of candidateSliceOp by computing the required slice of the producer i...
Definition: TileUsingInterface.h:203

mlir::scf::SCFFuseProducerOfSliceResult::tiledAndFusedProducer
Value tiledAndFusedProducer
Definition: TileUsingInterface.h:205

mlir::scf::SCFFuseProducerOfSliceResult::generatedSlices
SmallVector< Operation * > generatedSlices
Definition: TileUsingInterface.h:207

mlir::scf::SCFFuseProducerOfSliceResult::origProducer
OpResult origProducer
Definition: TileUsingInterface.h:204

mlir::scf::SCFFuseProducerOfSliceResult::tiledOps
SmallVector< Operation * > tiledOps
Definition: TileUsingInterface.h:206

mlir::scf::SCFTileAndFuseOptions::ControlFnResult
Control function to check if a slice needs to be fused or not, The control function receives 1) the s...
Definition: TileUsingInterface.h:174

mlir::scf::SCFTileAndFuseOptions::ControlFnResult::yieldProducerReplacement
bool yieldProducerReplacement
Set to true if the loop nest has to return a replacement value for the fused producer.
Definition: TileUsingInterface.h:177

mlir::scf::SCFTileAndFuseOptions
Options used to control tile + fuse.
Definition: TileUsingInterface.h:157

mlir::scf::SCFTileAndFuseOptions::tilingOptions
SCFTilingOptions tilingOptions
The tiling options used to control the tiling of the consumer.
Definition: TileUsingInterface.h:159

mlir::scf::SCFTileAndFuseOptions::cleanupPatterns
std::optional< FrozenRewritePatternSet > cleanupPatterns
An optional set of rewrite patterns to apply to the results of tiling before fusion.
Definition: TileUsingInterface.h:196

mlir::scf::SCFTileAndFuseOptions::setTilingOptions
SCFTileAndFuseOptions & setTilingOptions(SCFTilingOptions options)
Definition: TileUsingInterface.h:160

mlir::scf::SCFTileAndFuseOptions::fusionControlFn
ControlFnTy fusionControlFn
The default control function implements greedy fusion without yielding a replacement for any of the f...
Definition: TileUsingInterface.h:184

mlir::scf::SCFTileAndFuseOptions::ControlFnTy
std::function< std::optional< ControlFnResult >(tensor::ExtractSliceOp candidateSliceOp, OpResult originalProducer, bool isDestinationOperand)> ControlFnTy
Definition: TileUsingInterface.h:181

mlir::scf::SCFTileAndFuseOptions::setFusionControlFn
SCFTileAndFuseOptions & setFusionControlFn(ControlFnTy controlFn)
Definition: TileUsingInterface.h:188

mlir::scf::SCFTileAndFuseResult
Transformation information returned after tile and fuse.
Definition: TileUsingInterface.h:277

mlir::scf::SCFTileAndFuseResult::loops
SmallVector< LoopLikeOpInterface > loops
The scf.for operations that iterate over the tiles.
Definition: TileUsingInterface.h:285

mlir::scf::SCFTileAndFuseResult::fusedProducers
llvm::SetVector< Operation * > fusedProducers
List of untiled operations that were fused with the tiled consumer.
Definition: TileUsingInterface.h:279

mlir::scf::SCFTileAndFuseResult::replacements
llvm::DenseMap< Value, Value > replacements
The replacement values to use for the tiled and fused operations.
Definition: TileUsingInterface.h:287

mlir::scf::SCFTileAndFuseResult::tiledAndFusedOps
llvm::SetVector< Operation * > tiledAndFusedOps
List of tiled and fused operations generated.
Definition: TileUsingInterface.h:283

mlir::scf::SCFTilingOptions
Options to use to control tiling.
Definition: TileUsingInterface.h:35

mlir::scf::SCFTilingOptions::tileSizeComputationFunction
SCFTileSizeComputationFunction tileSizeComputationFunction
Computation function that returns the tile sizes to use for each loop.
Definition: TileUsingInterface.h:41

mlir::scf::SCFTilingOptions::setTileSizeComputationFunction
SCFTilingOptions & setTileSizeComputationFunction(SCFTileSizeComputationFunction fun)
Definition: TileUsingInterface.h:44

mlir::scf::SCFTilingOptions::setReductionTilingStrategy
SCFTilingOptions & setReductionTilingStrategy(ReductionTilingStrategy strategy)
Definition: TileUsingInterface.h:113

mlir::scf::SCFTilingOptions::loopType
LoopType loopType
Definition: TileUsingInterface.h:82

mlir::scf::SCFTilingOptions::setNumThreadsComputationFunction
SCFTilingOptions & setNumThreadsComputationFunction(SCFTileSizeComputationFunction fun)
Definition: TileUsingInterface.h:65

mlir::scf::SCFTilingOptions::setNumThreads
SCFTilingOptions & setNumThreads(ArrayRef< OpFoldResult > numThreads)
Convenience function to set the numThreadsComputationFunction to a function that computes num threads...
Definition: TileUsingInterface.cpp:51

mlir::scf::SCFTilingOptions::setInterchange
SCFTilingOptions & setInterchange(ArrayRef< int64_t > interchange)
Definition: TileUsingInterface.h:75

mlir::scf::SCFTilingOptions::setTileSizes
SCFTilingOptions & setTileSizes(ArrayRef< OpFoldResult > tileSizes)
Convenience function to set the tileSizeComputationFunction to a function that computes tile sizes at...
Definition: TileUsingInterface.cpp:41

mlir::scf::SCFTilingOptions::numThreadsComputationFunction
SCFTileSizeComputationFunction numThreadsComputationFunction
Computation function that returns the number of threads to use for each loop.
Definition: TileUsingInterface.h:62

mlir::scf::SCFTilingOptions::ReductionTilingStrategy
ReductionTilingStrategy
Specify how reduction dimensions should be tiled.
Definition: TileUsingInterface.h:99

mlir::scf::SCFTilingOptions::ReductionTilingStrategy::FullReduction
@ FullReduction

mlir::scf::SCFTilingOptions::ReductionTilingStrategy::PartialReductionOuterReduction
@ PartialReductionOuterReduction

mlir::scf::SCFTilingOptions::ReductionTilingStrategy::PartialReductionOuterParallel
@ PartialReductionOuterParallel

mlir::scf::SCFTilingOptions::interchangeVector
SmallVector< int64_t > interchangeVector
The interchange vector to reorder the tiled loops.
Definition: TileUsingInterface.h:74

mlir::scf::SCFTilingOptions::LoopType
LoopType
Specify which loop construct to use for tile and fuse.
Definition: TileUsingInterface.h:81

mlir::scf::SCFTilingOptions::LoopType::ForallOp
@ ForallOp

mlir::scf::SCFTilingOptions::LoopType::ForOp
@ ForOp

mlir::scf::SCFTilingOptions::mappingVector
SmallVector< Attribute > mappingVector
Specify mapping of loops to devices.
Definition: TileUsingInterface.h:122

mlir::scf::SCFTilingOptions::setLoopType
SCFTilingOptions & setLoopType(LoopType type)
Definition: TileUsingInterface.h:83

mlir::scf::SCFTilingOptions::setMapping
SCFTilingOptions & setMapping(ArrayRef< Attribute > mapping)
Definition: TileUsingInterface.h:123

mlir::scf::SCFTilingOptions::reductionStrategy
ReductionTilingStrategy reductionStrategy
Definition: TileUsingInterface.h:110

mlir::scf::SCFTilingResult
Transformation information returned after tiling.
Definition: TileUsingInterface.h:130

mlir::scf::SCFTilingResult::tiledOps
SmallVector< Operation * > tiledOps
Tiled operations that are generated during tiling.
Definition: TileUsingInterface.h:134

mlir::scf::SCFTilingResult::initialValues
SmallVector< Value > initialValues
The initial destination values passed to the tiled operations.
Definition: TileUsingInterface.h:136

mlir::scf::SCFTilingResult::loops
SmallVector< LoopLikeOpInterface > loops
The scf.for operations that iterate over the tiles.
Definition: TileUsingInterface.h:138

mlir::scf::SCFTilingResult::mergeResult
MergeResult mergeResult
The result generated by the loop nest in tiling, may hold partial results, which need to be merged to...
Definition: TileUsingInterface.h:144

mlir::scf::SCFTilingResult::generatedSlices
SmallVector< Operation * > generatedSlices
Slices generated after tiling that can be used for fusing with the tiled producer.
Definition: TileUsingInterface.h:147