doxygen/Dialect_2SCF_2Utils_2Utils_8h_source.html

 //===- Utils.h - SCF dialect utilities --------------------------*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This header file defines prototypes for various SCF utilities.

 //

 //===----------------------------------------------------------------------===//


 #ifndef MLIR_DIALECT_SCF_UTILS_UTILS_H_

 #define MLIR_DIALECT_SCF_UTILS_UTILS_H_


 #include "mlir/Dialect/SCF/IR/SCF.h"

 #include "mlir/IR/PatternMatch.h"

 #include "mlir/Support/LLVM.h"

 #include "llvm/ADT/STLExtras.h"

 #include <optional>


 namespace mlir {

 class Location;

 class Operation;

 class OpBuilder;

 class Region;

 class RewriterBase;

 class ValueRange;

 class Value;


 namespace func {

 class CallOp;

 class FuncOp;

 } // namespace func


 /// Update a perfectly nested loop nest to yield new values from the innermost

 /// loop and propagating it up through the loop nest. This function

 /// - Expects `loopNest` to be a perfectly nested loop with outer most loop

 ///   first and innermost loop last.

 /// - `newIterOperands` are the initialization values to be used for the

 ///    outermost loop

 /// - `newYielValueFn` is the callback that generates the new values to be

 ///   yielded from within the innermost loop.

 /// - The original loops are not erased,  but are left in a "no-op" state where

 ///   the body of the loop just yields the basic block arguments that correspond

 ///   to the initialization values of a loop. The original loops are dead after

 ///   this method.

 /// - If `replaceIterOperandsUsesInLoop` is true, all uses of the

 ///   `newIterOperands` within the generated new loop are replaced with the

 ///   corresponding `BlockArgument` in the loop body.

 SmallVector<scf::ForOp> replaceLoopNestWithNewYields(

     RewriterBase &rewriter, MutableArrayRef<scf::ForOp> loopNest,

     ValueRange newIterOperands, const NewYieldValuesFn &newYieldValuesFn,

     bool replaceIterOperandsUsesInLoop = true);


 /// Outline a region with a single block into a new FuncOp.

 /// Assumes the FuncOp result types is the type of the yielded operands of the

 /// single block. This constraint makes it easy to determine the result.

 /// This method also clones the `arith::ConstantIndexOp` at the start of

 /// `outlinedFuncBody` to alloc simple canonicalizations.

 /// Creates a new FuncOp and thus cannot be used in a FuncOp pass.

 /// The client is responsible for providing a unique `funcName` that will not

 /// collide with another FuncOp name.  If `callOp` is provided, it will be set

 /// to point to the operation that calls the outlined function.

 // TODO: support more than single-block regions.

 // TODO: more flexible constant handling.

 FailureOr<func::FuncOp>

 outlineSingleBlockRegion(RewriterBase &rewriter, Location loc, Region &region,

                          StringRef funcName, func::CallOp *callOp = nullptr);


 /// Outline the then and/or else regions of `ifOp` as follows:

 ///  - if `thenFn` is not null, `thenFnName` must be specified and the `then`

 ///    region is inlined into a new FuncOp that is captured by the pointer.

 ///  - if `elseFn` is not null, `elseFnName` must be specified and the `else`

 ///    region is inlined into a new FuncOp that is captured by the pointer.

 /// Creates new FuncOps and thus cannot be used in a FuncOp pass.

 /// The client is responsible for providing a unique `thenFnName`/`elseFnName`

 /// that will not collide with another FuncOp name.

 LogicalResult outlineIfOp(RewriterBase &b, scf::IfOp ifOp, func::FuncOp *thenFn,

                           StringRef thenFnName, func::FuncOp *elseFn,

                           StringRef elseFnName);


 /// Get a list of innermost parallel loops contained in `rootOp`. Innermost

 /// parallel loops are those that do not contain further parallel loops

 /// themselves.

 bool getInnermostParallelLoops(Operation *rootOp,

                                SmallVectorImpl<scf::ParallelOp> &result);


 /// Return the min/max expressions for `value` if it is an induction variable

 /// from scf.for or scf.parallel loop.

 /// if `loopFilter` is passed, the filter determines which loop to consider.

 /// Other induction variables are ignored.

 std::optional<std::pair<AffineExpr, AffineExpr>>

 getSCFMinMaxExpr(Value value, SmallVectorImpl<Value> &dims,

                  SmallVectorImpl<Value> &symbols,

                  llvm::function_ref<bool(Operation *)> loopFilter = nullptr);


 /// Replace a perfect nest of "for" loops with a single linearized loop. Assumes

 /// `loops` contains a list of perfectly nested loops with bounds and steps

 /// independent of any loop induction variable involved in the nest.

 LogicalResult coalesceLoops(MutableArrayRef<scf::ForOp> loops);

 LogicalResult coalesceLoops(RewriterBase &rewriter,

                             MutableArrayRef<scf::ForOp>);


 /// Walk an affine.for to find a band to coalesce.

 LogicalResult coalescePerfectlyNestedSCFForLoops(scf::ForOp op);


 /// Take the ParallelLoop and for each set of dimension indices, combine them

 /// into a single dimension. combinedDimensions must contain each index into

 /// loops exactly once.

 void collapseParallelLoops(RewriterBase &rewriter, scf::ParallelOp loops,

                            ArrayRef<std::vector<unsigned>> combinedDimensions);


 struct UnrolledLoopInfo {

   std::optional<scf::ForOp> mainLoopOp = std::nullopt;

   std::optional<scf::ForOp> epilogueLoopOp = std::nullopt;

 };


 /// Unrolls this for operation by the specified unroll factor. Returns the

 /// unrolled main loop and the epilogue loop, if the loop is unrolled. Otherwise

 /// returns failure if the loop cannot be unrolled either due to restrictions or

 /// due to invalid unroll factors. Requires positive loop bounds and step. If

 /// specified, annotates the Ops in each unrolled iteration by applying

 /// `annotateFn`.

 FailureOr<UnrolledLoopInfo> loopUnrollByFactor(

     scf::ForOp forOp, uint64_t unrollFactor,

     function_ref<void(unsigned, Operation *, OpBuilder)> annotateFn = nullptr);


 /// Unrolls this loop completely.

 LogicalResult loopUnrollFull(scf::ForOp forOp);


 /// Unrolls and jams this `scf.for` operation by the specified unroll factor.

 /// Returns failure if the loop cannot be unrolled either due to restrictions or

 /// due to invalid unroll factors. In case of unroll factor of 1, the function

 /// bails out without doing anything (returns success). Currently, only constant

 /// trip count that are divided by the unroll factor is supported. Currently,

 /// for operations with results are not supported.

 LogicalResult loopUnrollJamByFactor(scf::ForOp forOp, uint64_t unrollFactor);


 /// Materialize bounds and step of a zero-based and unit-step loop derived by

 /// normalizing the specified bounds and step.

 Range emitNormalizedLoopBounds(RewriterBase &rewriter, Location loc,

                                OpFoldResult lb, OpFoldResult ub,

                                OpFoldResult step);


 /// Get back the original induction variable values after loop normalization.

 void denormalizeInductionVariable(RewriterBase &rewriter, Location loc,

                                   Value normalizedIv, OpFoldResult origLb,

                                   OpFoldResult origStep);


 /// Tile a nest of standard for loops rooted at `rootForOp` by finding such

 /// parametric tile sizes that the outer loops have a fixed number of iterations

 /// as defined in `sizes`.

 using Loops = SmallVector<scf::ForOp, 8>;

 using TileLoops = std::pair<Loops, Loops>;

 TileLoops extractFixedOuterLoops(scf::ForOp rootFOrOp, ArrayRef<int64_t> sizes);


 /// Performs tiling fo imperfectly nested loops (with interchange) by

 /// strip-mining the `forOps` by `sizes` and sinking them, in their order of

 /// occurrence in `forOps`, under each of the `targets`.

 /// Returns the new AffineForOps, one per each of (`forOps`, `targets`) pair,

 /// nested immediately under each of `targets`.

 SmallVector<Loops, 8> tile(ArrayRef<scf::ForOp> forOps, ArrayRef<Value> sizes,

                            ArrayRef<scf::ForOp> targets);


 /// Performs tiling (with interchange) by strip-mining the `forOps` by `sizes`

 /// and sinking them, in their order of occurrence in `forOps`, under `target`.

 /// Returns the new AffineForOps, one per `forOps`, nested immediately under

 /// `target`.

 Loops tile(ArrayRef<scf::ForOp> forOps, ArrayRef<Value> sizes,

            scf::ForOp target);


 /// Tile a nest of scf::ForOp loops rooted at `rootForOp` with the given

 /// (parametric) sizes. Sizes are expected to be strictly positive values at

 /// runtime.  If more sizes than loops are provided, discard the trailing values

 /// in sizes.  Assumes the loop nest is permutable.

 /// Returns the newly created intra-tile loops.

 Loops tilePerfectlyNested(scf::ForOp rootForOp, ArrayRef<Value> sizes);


 /// Get perfectly nested sequence of loops starting at root of loop nest

 /// (the first op being another AffineFor, and the second op - a terminator).

 /// A loop is perfectly nested iff: the first op in the loop's body is another

 /// AffineForOp, and the second op is a terminator).

 void getPerfectlyNestedLoops(SmallVectorImpl<scf::ForOp> &nestedLoops,

                              scf::ForOp root);


 /// Given two scf.forall loops, `target` and `source`, fuses `target` into

 /// `source`. Assumes that the given loops are siblings and are independent of

 /// each other.

 ///

 /// This function does not perform any legality checks and simply fuses the

 /// loops. The caller is responsible for ensuring that the loops are legal to

 /// fuse.

 scf::ForallOp fuseIndependentSiblingForallLoops(scf::ForallOp target,

                                                 scf::ForallOp source,

                                                 RewriterBase &rewriter);


 /// Given two scf.for loops, `target` and `source`, fuses `target` into

 /// `source`. Assumes that the given loops are siblings and are independent of

 /// each other.

 ///

 /// This function does not perform any legality checks and simply fuses the

 /// loops. The caller is responsible for ensuring that the loops are legal to

 /// fuse.

 scf::ForOp fuseIndependentSiblingForLoops(scf::ForOp target, scf::ForOp source,

                                           RewriterBase &rewriter);


 /// Normalize an `scf.forall` operation. Returns `failure()`if normalization

 /// fails.

 // On `success()` returns the

 /// newly created operation with all uses of the original operation replaced

 /// with results of the new operation.

 FailureOr<scf::ForallOp> normalizeForallOp(RewriterBase &rewriter,

                                            scf::ForallOp forallOp);


 } // namespace mlir


 #endif // MLIR_DIALECT_SCF_UTILS_UTILS_H_

PatternMatch.h

llvm::ArrayRef
Definition: LLVM.h:48

llvm::MutableArrayRef
Definition: LLVM.h:62

llvm::SmallVectorImpl
Definition: LLVM.h:74

llvm::SmallVector
Definition: LLVM.h:72

llvm::function_ref
Definition: LLVM.h:90

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:76

mlir::OpBuilder
This class helps build Operations.
Definition: Builders.h:204

mlir::OpFoldResult
This class represents a single result from folding an operation.
Definition: OpDefinition.h:271

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::RewriterBase
This class coordinates the application of a rewrite on a set of IR, providing a way for clients to tr...
Definition: PatternMatch.h:358

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

SCF.h

LLVM.h

mlir::lsp::CompletionItemKind::Value
@ Value

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::getPerfectlyNestedLoops
void getPerfectlyNestedLoops(SmallVectorImpl< scf::ForOp > &nestedLoops, scf::ForOp root)
Get perfectly nested sequence of loops starting at root of loop nest (the first op being another Affi...
Definition: Utils.cpp:1330

mlir::outlineIfOp
LogicalResult outlineIfOp(RewriterBase &b, scf::IfOp ifOp, func::FuncOp *thenFn, StringRef thenFnName, func::FuncOp *elseFn, StringRef elseFnName)
Outline the then and/or else regions of ifOp as follows:
Definition: Utils.cpp:223

mlir::replaceLoopNestWithNewYields
SmallVector< scf::ForOp > replaceLoopNestWithNewYields(RewriterBase &rewriter, MutableArrayRef< scf::ForOp > loopNest, ValueRange newIterOperands, const NewYieldValuesFn &newYieldValuesFn, bool replaceIterOperandsUsesInLoop=true)
Update a perfectly nested loop nest to yield new values from the innermost loop and propagating it up...
Definition: Utils.cpp:40

mlir::coalescePerfectlyNestedSCFForLoops
LogicalResult coalescePerfectlyNestedSCFForLoops(scf::ForOp op)
Walk an affine.for to find a band to coalesce.
Definition: Utils.cpp:1001

mlir::TileLoops
std::pair< Loops, Loops > TileLoops
Definition: Utils.h:155

mlir::loopUnrollFull
LogicalResult loopUnrollFull(scf::ForOp forOp)
Unrolls this loop completely.
Definition: Utils.cpp:502

mlir::collapseParallelLoops
void collapseParallelLoops(RewriterBase &rewriter, scf::ParallelOp loops, ArrayRef< std::vector< unsigned >> combinedDimensions)
Take the ParallelLoop and for each set of dimension indices, combine them into a single dimension.
Definition: Utils.cpp:1076

mlir::NewYieldValuesFn
std::function< SmallVector< Value >(OpBuilder &b, Location loc, ArrayRef< BlockArgument > newBbArgs)> NewYieldValuesFn
A function that returns the additional yielded values during replaceWithAdditionalYields.
Definition: LoopLikeInterface.h:26

mlir::tilePerfectlyNested
Loops tilePerfectlyNested(scf::ForOp rootForOp, ArrayRef< Value > sizes)
Tile a nest of scf::ForOp loops rooted at rootForOp with the given (parametric) sizes.
Definition: Utils.cpp:1318

mlir::loopUnrollByFactor
FailureOr< UnrolledLoopInfo > loopUnrollByFactor(scf::ForOp forOp, uint64_t unrollFactor, function_ref< void(unsigned, Operation *, OpBuilder)> annotateFn=nullptr)
Unrolls this for operation by the specified unroll factor.
Definition: Utils.cpp:378

mlir::loopUnrollJamByFactor
LogicalResult loopUnrollJamByFactor(scf::ForOp forOp, uint64_t unrollFactor)
Unrolls and jams this scf.for operation by the specified unroll factor.
Definition: Utils.cpp:530

mlir::getInnermostParallelLoops
bool getInnermostParallelLoops(Operation *rootOp, SmallVectorImpl< scf::ParallelOp > &result)
Get a list of innermost parallel loops contained in rootOp.
Definition: Utils.cpp:246

mlir::tile
SmallVector< Loops, 8 > tile(ArrayRef< scf::ForOp > forOps, ArrayRef< Value > sizes, ArrayRef< scf::ForOp > targets)
Performs tiling fo imperfectly nested loops (with interchange) by strip-mining the forOps by sizes an...
Definition: Utils.cpp:1297

mlir::getSCFMinMaxExpr
std::optional< std::pair< AffineExpr, AffineExpr > > getSCFMinMaxExpr(Value value, SmallVectorImpl< Value > &dims, SmallVectorImpl< Value > &symbols, llvm::function_ref< bool(Operation *)> loopFilter=nullptr)
Return the min/max expressions for value if it is an induction variable from scf.for or scf....

mlir::outlineSingleBlockRegion
FailureOr< func::FuncOp > outlineSingleBlockRegion(RewriterBase &rewriter, Location loc, Region &region, StringRef funcName, func::CallOp *callOp=nullptr)
Outline a region with a single block into a new FuncOp.
Definition: Utils.cpp:119

mlir::denormalizeInductionVariable
void denormalizeInductionVariable(RewriterBase &rewriter, Location loc, Value normalizedIv, OpFoldResult origLb, OpFoldResult origStep)
Get back the original induction variable values after loop normalization.
Definition: Utils.cpp:779

mlir::fuseIndependentSiblingForallLoops
scf::ForallOp fuseIndependentSiblingForallLoops(scf::ForallOp target, scf::ForallOp source, RewriterBase &rewriter)
Given two scf.forall loops, target and source, fuses target into source.
Definition: Utils.cpp:1377

mlir::coalesceLoops
LogicalResult coalesceLoops(MutableArrayRef< scf::ForOp > loops)
Replace a perfect nest of "for" loops with a single linearized loop.
Definition: Utils.cpp:993

mlir::fuseIndependentSiblingForLoops
scf::ForOp fuseIndependentSiblingForLoops(scf::ForOp target, scf::ForOp source, RewriterBase &rewriter)
Given two scf.for loops, target and source, fuses target into source.
Definition: Utils.cpp:1429

mlir::extractFixedOuterLoops
TileLoops extractFixedOuterLoops(scf::ForOp rootFOrOp, ArrayRef< int64_t > sizes)
Definition: Utils.cpp:1335

mlir::emitNormalizedLoopBounds
Range emitNormalizedLoopBounds(RewriterBase &rewriter, Location loc, OpFoldResult lb, OpFoldResult ub, OpFoldResult step)
Materialize bounds and step of a zero-based and unit-step loop derived by normalizing the specified b...
Definition: Utils.cpp:708

mlir::normalizeForallOp
FailureOr< scf::ForallOp > normalizeForallOp(RewriterBase &rewriter, scf::ForallOp forallOp)
Normalize an scf.forall operation.
Definition: Utils.cpp:1479

mlir::Range
Represents a range (offset, size, and stride) where each element of the triple may be dynamic or stat...
Definition: StaticValueUtils.h:35

mlir::UnrolledLoopInfo
Definition: Utils.h:114

mlir::UnrolledLoopInfo::epilogueLoopOp
std::optional< scf::ForOp > epilogueLoopOp
Definition: Utils.h:116

mlir::UnrolledLoopInfo::mainLoopOp
std::optional< scf::ForOp > mainLoopOp
Definition: Utils.h:115