doxygen/include_2mlir_2Dialect_2Linalg_2Utils_2Utils_8h_source.html

//===- Utils.h - Utilities to support the Linalg dialect --------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#ifndef MLIR_DIALECT_LINALG_UTILS_UTILS_H

#define MLIR_DIALECT_LINALG_UTILS_UTILS_H


#include "mlir/Dialect/Linalg/IR/Linalg.h"

#include "mlir/Dialect/SCF/IR/SCF.h"

#include "mlir/Dialect/Utils/StructuredOpsUtils.h"

#include "llvm/ADT/StringSet.h"

#include <optional>


namespace mlir {

class AffineExpr;

class AffineMap;

class PatternRewriter;


namespace affine {

class AffineForOp;

} // namespace affine


namespace tensor {

class ExtractSliceOp;

} // namespace tensor


namespace linalg {


//===----------------------------------------------------------------------===//

// Utilities for inferring various semantics properties of Linalg ops.

//===----------------------------------------------------------------------===//


/// Compute the inverse permutation for the destination tensor of `packOp`
/// (i.e. in the packed domain).
// NOTE(review): `metadata` is taken by non-const reference, so it is
// presumably filled in as an output -- confirm against the definition.
SmallVector<int64_t> getPackInverseDestPerm(linalg::PackOp packOp,
                                            PackingMetadata &metadata);


/// Compute the inverse permutation for the source tensor of the given unpack
/// op (i.e. in the packed domain).
// NOTE(review): `metadata` is taken by non-const reference, so it is
// presumably filled in as an output -- confirm against the definition.
SmallVector<int64_t> getUnPackInverseSrcPerm(linalg::UnPackOp,
                                             PackingMetadata &metadata);


//===----------------------------------------------------------------------===//

// General utilities

//===----------------------------------------------------------------------===//


/// Check if all indexing maps of `op` are projected permutations. Returns
/// true when they are.
bool allIndexingsAreProjectedPermutation(LinalgOp op);


/// Detect whether region `r` has only ConstantOp, ElementwiseMappable and
/// YieldOp operations. Returns true when that is the case.
bool hasOnlyScalarElementwiseOp(Region &r);


/// Check if the LinalgOp `op` is an element-wise operation. Returns true
/// when it is.
bool isElementwise(LinalgOp op);


/// Check if `iteratorType` has "parallel" semantics. Returns true when it
/// does.
bool isParallelIterator(utils::IteratorType iteratorType);


/// Check if `iteratorType` has "reduction" semantics. Returns true when it
/// does.
bool isReductionIterator(utils::IteratorType iteratorType);


/// Create a tensor::PadOp that pads `source` to the shape of `type` whose sizes
/// are assumed to be greater than the dynamic `source` size. If `typeDynDims`
/// is specified, then it must contain the sizes of all the dynamic dimensions
/// in order of appearance in `type`, otherwise the function will pad those
/// values to `0`. The padding introduces trailing `padding` values until the
/// target size is met. If `source` is defined by one or more LinalgOps that
/// have been padded with the same value and sizes, return their padded result
/// instead of creating a tensor::PadOp.
///
/// Example:
/// ```
/// %0 = tensor.extract_slice %arg0 [%iv0, %iv1] [%sz0, %sz1]
/// %1 = tensor.pad %0 low[0, 0] high[...] { tensor.yield %cst }
/// %2 = linalg.matmul ins(...) outs(%1)
/// %3 = tensor.extract_slice %2 [0, 0] [%sz0, %sz1]
/// ```
/// makeComposedPadHighOp(source=%3, padding=%cst) returns %2
/// makeComposedPadHighOp(source=%3, padding=%other_cst) returns %4
/// ```
/// %4 = tensor.pad %3 low[0, 0] high[...] { tensor.yield %other_cst }
/// ```
// NOTE(review): `nofold` is not described above; presumably it sets the
// `nofold` flag on the created tensor::PadOp -- confirm against the
// definition.
Value makeComposedPadHighOp(OpBuilder &b, Location loc, RankedTensorType type,
                            Value source, Value padding, bool nofold,
                            ValueRange typeDynDims = {});


/// Returns a GenericOp that copies an n-D memref from `from` to `to`. Unlike
/// the current implementation of memref::CopyOp, this op can further tile,
/// lower to loops or vectorize.
GenericOp makeMemRefCopyOp(OpBuilder &b, Location loc, Value from, Value to);


/// Get the reassociation maps to fold the result of an extract_slice (or
/// source of an insert_slice) operation with given offsets, and sizes to its
/// rank-reduced version. This is only done for the cases where the size is 1
/// and offset is 0. Strictly speaking the offset 0 is not required in
/// general, but non-zero offsets are not handled by SPIR-V backend at this
/// point (and potentially cannot be handled).
// NOTE(review): only `mixedSizes` is passed in, so the offset condition
// described above cannot be checked from this signature -- confirm that the
// comment still matches the implementation.
std::optional<SmallVector<ReassociationIndices>>
getReassociationMapForFoldingUnitDims(ArrayRef<OpFoldResult> mixedSizes);


//===----------------------------------------------------------------------===//

// Convolution matcher utility

//===----------------------------------------------------------------------===//


/// A struct containing dilations and strides inferred from convolution ops.
/// It is the payload returned by matchConvolutionOpOfType.
struct DilationsAndStrides {
  // Inferred dilation values.
  SmallVector<int64_t> dilations;
  // Inferred stride values.
  SmallVector<int64_t> strides;
};


/// Given a linalg `op` this function returns DilationsAndStrides if it is a
/// convolution op of type `ConvOpTy`, otherwise returns std::nullopt. The
/// dilations and strides are inferred from the indexing maps. For ops like
/// Conv1DOp, Conv2DOp and Conv3DOp that have no strides/dilations attributes,
/// defaults of [1, ...] are returned for both.
///
/// Only the template declaration is visible in this header; the definitions
/// are not part of this file.
template <typename ConvOpTy>
std::optional<DilationsAndStrides> matchConvolutionOpOfType(LinalgOp op);


/// Convenience predicate over matchConvolutionOpOfType: reports whether the
/// linalg `op` is a convolution op of type `ConvOpTy`, i.e. whether the
/// matcher produced a value for it.
template <typename ConvOpTy>
bool isaConvolutionOpOfType(LinalgOp op) {
  const auto match = matchConvolutionOpOfType<ConvOpTy>(op);
  return static_cast<bool>(match);
}


//===----------------------------------------------------------------------===//

// Fusion / Tiling utilities

//===----------------------------------------------------------------------===//


/// The type of loops to be generated during tiling.
// NOTE(review): the enumerator names suggest scf.for / affine.for /
// scf.parallel loops respectively -- confirm against the users of this enum.
enum class LinalgTilingLoopType {
  Loops = 0,
  AffineLoops = 1,
  ParallelLoops = 2
};


/// Computes tile offsets, given a list of loop `ivs` and `tileSizes`. In case
/// a tile size is zero (i.e., no tiling), the corresponding offset is also
/// zero. Returns one OpFoldResult per computed offset.
SmallVector<OpFoldResult> computeTileOffsets(OpBuilder &b, Location loc,
                                             ArrayRef<OpFoldResult> ivs,
                                             ArrayRef<OpFoldResult> tileSizes);


/// Computes tile sizes, given a list of `tileSizes` and dimension
/// sizes (`sizeBounds`). In case a tile size is zero (i.e., no tiling), the
/// corresponding result size is the corresponding value from `sizeBounds`.
///
/// Note: The returned tile sizes are closed intervals.
SmallVector<OpFoldResult> computeTileSizes(OpBuilder &b, Location loc,
                                           ArrayRef<OpFoldResult> tileSizes,
                                           ArrayRef<OpFoldResult> sizeBounds);


/// Returns the list of tensor output types produced when the given structured
/// operation `op` is applied to the given `operands`.
///
/// Note that `operands` are not necessarily the actual operands of `op`.
SmallVector<Type> getTensorOutputTypes(LinalgOp op, ValueRange operands);


/// Creates `insert_slice` ops that insert `results` back into larger tensors
/// they were originally extracted from with `extract_slice` before being
/// passed as `operands` to the given structured operation `op` or its clone.
///
/// Note that `operands` are not necessarily the actual operands of `op`; the
/// operation serves only as a metadata container for operand types and
/// positions.
SmallVector<Value> insertSlicesBack(OpBuilder &builder, Location loc,
                                    LinalgOp op, ValueRange operands,
                                    ValueRange results);


/// A struct containing offsets-sizes-strides arguments of the tiled shape.
/// It is the result type of computeSliceParameters.
struct SliceParameters {
  SmallVector<OpFoldResult> offsets;
  SmallVector<OpFoldResult> sizes;
  SmallVector<OpFoldResult> strides;
};


/// Computes SliceParameters for a single `valueToTile` assuming that its user
/// is being tiled with the given loop bounds `lbs` and `ubs` and the tile
/// sizes `tileSizes`.
///
/// `omitPartialTileCheck` controls whether to omit the partial/boundary tile
/// condition check in cases where we statically know that it is unnecessary.
// NOTE(review): `map` and `subShapeSizes` are not described above;
// presumably `map` is the indexing map through which the user accesses
// `valueToTile` -- confirm against the definition.
SliceParameters
computeSliceParameters(OpBuilder &builder, Location loc, Value valueToTile,
                       ArrayRef<OpFoldResult> tileSizes, AffineMap map,
                       ArrayRef<OpFoldResult> lbs, ArrayRef<OpFoldResult> ubs,
                       ArrayRef<OpFoldResult> subShapeSizes,
                       bool omitPartialTileCheck);


/// Computes SliceParameters for all `valuesToTile` of the given `linalgOp`,
/// assuming `linalgOp` is being fused into a loop nest. Calls
/// `computeSliceParameters` for every individual value.
///
/// Note that a constant zero in `tileSizes` means no tiling at that implicit
/// loop. The number of non-zero values in `tileSizes` should be equal to the
/// number of values in `ivs`.
///
/// Some of the `valuesToTile` won't be affected by tiling. For these values,
/// std::nullopt will be returned.
SmallVector<std::optional<SliceParameters>>
computeAllSliceParameters(OpBuilder &builder, Location loc, LinalgOp linalgOp,
                          ValueRange valuesToTile, ArrayRef<OpFoldResult> ivs,
                          ArrayRef<OpFoldResult> tileSizes,
                          ArrayRef<OpFoldResult> sizeBounds,
                          bool omitPartialTileCheck);


/// Creates an extract_slice/subview op for a single `valueToTile` with
/// `builder`. This new operation extracts a tile of `valueToTile`, starting
/// at offsets `lbs` and with sizes `subShapeSizes`.
///
/// `omitPartialTileCheck` controls whether to omit the partial/boundary tile
/// condition check in cases where we statically know that it is unnecessary.
///
/// The parameter list is the same as that of computeSliceParameters.
Operation *makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile,
                          ArrayRef<OpFoldResult> tileSizes, AffineMap map,
                          ArrayRef<OpFoldResult> lbs,
                          ArrayRef<OpFoldResult> ubs,
                          ArrayRef<OpFoldResult> subShapeSizes,
                          bool omitPartialTileCheck);


/// Creates extract_slice/subview ops for all `valuesToTile` of the given
/// `linalgOp` with `builder`, assuming `linalgOp` is being fused into a loop
/// nest for tiling with the given induction variables `ivs` and tile sizes
/// `tileSizes`. `sizeBounds` are the iteration space bounds for *all* the
/// implicit loops in `linalgOp`.
///
/// `omitPartialTileCheck` controls whether to omit the partial/boundary tile
/// condition check in cases where we statically know that it is unnecessary.
///
/// Note that a constant zero in `tileSizes` means no tiling at that implicit
/// loop. The number of non-zero values in `tileSizes` should be equal to the
/// number of values in `ivs`.
SmallVector<Value> makeTiledShapes(OpBuilder &builder, Location loc,
                                   LinalgOp linalgOp, ValueRange valuesToTile,
                                   ArrayRef<OpFoldResult> ivs,
                                   ArrayRef<OpFoldResult> tileSizes,
                                   ArrayRef<OpFoldResult> sizeBounds,
                                   bool omitPartialTileCheck);


/// Add the specified offsets to any `linalg.index` ops contained in the given
/// `linalgOp`. The offsets are provided in the same order as iteration space
/// dimensions. Null offsets are assumed to be zero.
///
/// Two overloads are provided: one taking an OpBuilder and one taking a
/// RewriterBase.
// NOTE(review): the parameter name `offests` is a misspelling of "offsets";
// it is left unchanged here so that the declarations stay as they were.
void offsetIndices(OpBuilder &b, LinalgOp linalgOp,
                   ArrayRef<OpFoldResult> offests);
void offsetIndices(RewriterBase &b, LinalgOp linalgOp,
                   ArrayRef<OpFoldResult> offests);


/// A struct containing the Linalg producer before and after fusion.
/// When operating on tensors, `fusedProducer` may feed into a `tensor.cast`
/// op before the consumer Linalg op, until enough canonicalizations have
/// applied.
struct FusionInfo {
  // The producer before fusion.
  LinalgOp originalProducer;
  // The producer after fusion.
  LinalgOp fusedProducer;
};


/// This implements the fusion part of the "tileAndFuse on tensors"
/// transformation and thus requires the `consumerOpOperand` to be an
/// `extract_slice` op (generally obtained by applying the tiling
/// transformation).
///
/// Returns the FusionInfo on success, or failure otherwise.
FailureOr<FusionInfo> fuseProducerOfTensor(OpBuilder &b,
                                           OpOperand &consumerOpOperand);


/// This implements the fusion part of the "tileAndFuse on tensors"
/// transformation and thus requires the `consumerOpOperand` to be an
/// `extract_slice` op (generally obtained by applying the tiling
/// transformation). Assumes `producerOpResult` is the result of a Linalg op
/// that produces `consumerOpOperand`.
///
/// Returns the FusionInfo on success, or failure otherwise.
FailureOr<FusionInfo> fuseProducerOfTensor(OpBuilder &b,
                                           OpResult producerOpResult,
                                           OpOperand &consumerOpOperand);


//===----------------------------------------------------------------------===//

// Distribution utilities

//===----------------------------------------------------------------------===//


/// Scheme used to distribute loops to processors.
enum class DistributionMethod {
  /// Cyclic distribution where no assumption is made about the dynamic
  /// relationship between number of processors and number of iterations of
  /// the distributed loop. Distributes the following loop
  ///
  /// scf.parallel (%iv) = (%lb) to (%ub) step (%step)
  ///
  /// to
  ///
  /// scf.parallel (%iv) = (%lb + %procId * %step) to (%ub)
  ///     step (%step * %nprocs)
  Cyclic = 0,

  /// Cyclic distribution where the number of processors can be assumed to be
  /// more than or equal to the number of iterations of the distributed loop.
  /// In such cases, a simple in-bounds check is enough (instead of
  /// materializing a loop). Distributes the following loop
  ///
  /// scf.parallel (%iv) = (%lb) to (%ub) step (%step)
  ///
  /// to
  ///
  /// %iv = %lb + %procId * %step
  /// %cond = arith.cmpi "slt", %iv, %ub
  /// scf.if %cond {
  ///   ...
  /// }
  CyclicNumProcsGeNumIters = 1,

  /// Cyclic distribution where the number of processors can be assumed to be
  /// equal to the number of iterations of the distributed loop. In such
  /// cases, no bounds check is needed. Distributes the following loop
  ///
  /// scf.parallel (%iv) = (%lb) to (%ub) step (%step)
  ///
  /// to
  ///
  /// %iv = %lb + %procId * %step
  CyclicNumProcsEqNumIters = 2,

  /// No Distribution.
  None = 3
};


/// Distribution information for one parallel loop: the processor ID
/// (`procId`), the number of processors (`nprocs`) and the
/// `distributionMethod` to use. Instances are produced by a
/// ProcInfoCallBackFn.
struct ProcInfo {
  Value procId;
  Value nprocs;
  DistributionMethod distributionMethod;
};

/// Callback function type used to get processor ID, and number of processors
/// used for distribution for all parallel loops generated. The callback
/// receives a builder, a location and the `parallelLoopRanges`, and returns a
/// list of ProcInfo.
using ProcInfoCallBackFn = std::function<SmallVector<ProcInfo>(
    OpBuilder &b, Location loc, ArrayRef<Range> parallelLoopRanges)>;


/// Options that allow distribution of loops generated in Linalg transforms to
/// processors while generating the loops.
struct LinalgLoopDistributionOptions {
  /// Callback function that returns the Values for processor ID (`procId`),
  /// and number of processors (`nprocs`) used to execute the parallel loops.
  /// The number of `{procId, nprocs}` pairs returned must be equal to the
  /// number of `parallelLoopRanges` passed into the callback. The
  /// `parallelLoopRanges` are ranges of the outer parallel loops of the
  /// operation that do have non-zero tile sizes specified.
  ///
  /// Each returned ProcInfo entry also carries a `distributionMethod`.
  ProcInfoCallBackFn procInfo;
};


/// Update the `lb`, `ub` and `step` to get per processor `lb`, `ub` and
/// `step`, given the processor ID `procId` and the number of processors
/// `nprocs`.
///
/// `lb`, `ub` and `step` are taken by reference and are updated in place;
/// nothing is returned.
void updateBoundsForCyclicDistribution(OpBuilder &builder, Location loc,
                                       Value procId, Value nprocs, Value &lb,
                                       Value &ub, Value &step);


//===----------------------------------------------------------------------===//

// Fusion on tensor utilities

//===----------------------------------------------------------------------===//


//===----------------------------------------------------------------------===//

// Generic op region utilities

//===----------------------------------------------------------------------===//


/// A struct containing common matchers over linalg op's region.
struct RegionMatcher {
  /// Kinds of binary operation that matchAsScalarBinaryOp can report.
  /// `IAdd` is the only kind declared here.
  enum class BinaryOpKind {
    IAdd,
  };

  /// Matches the given linalg op if its body is performing binary operation
  /// on int or float scalar values and returns the binary op kind.
  ///
  /// The linalg op's region is expected to be
  /// ```
  /// {
  ///   ^bb(%a: <scalar-type>, %b: <scalar-type>):
  ///     %0 = <binary-op> %a, %b: <scalar-type>
  ///     linalg.yield %0: <scalar-type>
  /// }
  /// ```
  // NOTE(review): presumably std::nullopt is returned when the region does
  // not match -- confirm against the definition.
  static std::optional<BinaryOpKind> matchAsScalarBinaryOp(GenericOp op);
};


//===----------------------------------------------------------------------===//

// Loop nest utilities

//===----------------------------------------------------------------------===//


/// Utility class used to generate nested loops with ranges described by
/// `loopRanges` and loop type described by the `iteratorTypes`.
/// `bodyBuilderFn` is used to generate the body of the innermost loop. It is
/// passed a range of loop induction variables and a range of operand values
/// to use.
///
/// `doit` is only declared here; its definitions are not part of this header.
// NOTE(review): `LoopTy` presumably selects the loop operation to emit, and
// an empty `procInfo` (the default) presumably means no distribution --
// confirm against the definitions.
template <typename LoopTy>
struct GenerateLoopNest {
  static void doit(OpBuilder &b, Location loc, ArrayRef<Range> loopRanges,
                   LinalgOp linalgOp,
                   ArrayRef<utils::IteratorType> iteratorTypes,
                   function_ref<scf::ValueVector(OpBuilder &, Location,
                                                 ValueRange, ValueRange)>
                       bodyBuilderFn,
                   ArrayRef<linalg::ProcInfo> procInfo = {});
};


/// Returns the attributes of `op` with the pre-defined ones pruned.
///
/// The names to elide are the op's own `getAttributeNames()`; when `op` is a
/// linalg::LinalgOp, `LinalgDialect::kMemoizedIndexingMapsAttrName` is elided
/// as well. The pruning itself is delegated to the two-argument
/// `getPrunedAttributeList` overload.
template <typename OpTy>
SmallVector<NamedAttribute> getPrunedAttributeList(OpTy op) {
  auto attrsToElide = llvm::to_vector(op.getAttributeNames());
  const bool isLinalgOp = isa<linalg::LinalgOp>(op.getOperation());
  if (isLinalgOp)
    attrsToElide.push_back(LinalgDialect::kMemoizedIndexingMapsAttrName);
  return getPrunedAttributeList(op, attrsToElide);
}


} // namespace linalg

} // namespace mlir


#endif // MLIR_DIALECT_LINALG_UTILS_UTILS_H

b
b
Return true if permutation is a valid permutation of the outer_dims_perm (case OuterOrInnerPerm::Oute...
Definition LinalgTransformOps.cpp:2119

StructuredOpsUtils.h

llvm::ArrayRef
Definition LLVM.h:40

llvm::SmallVector
Definition LLVM.h:64

mlir::AffineExpr
Base type for affine expression.
Definition AffineExpr.h:68

mlir::AffineMap
A multi-dimensional affine map Affine map's are immutable like Type's, and they are uniqued.
Definition AffineMap.h:46

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition Location.h:76

mlir::OpBuilder
This class helps build Operations.
Definition Builders.h:209

mlir::OpOperand
This class represents an operand of an operation.
Definition Value.h:257

mlir::OpResult
This is a value defined by a result of an operation.
Definition Value.h:457

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition Operation.h:88

mlir::PatternRewriter
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
Definition PatternMatch.h:799

mlir::Region
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition Region.h:26

mlir::RewriterBase
This class coordinates the application of a rewrite on a set of IR, providing a way for clients to tr...
Definition PatternMatch.h:368

mlir::ValueRange
This class provides an abstraction over the different types of ranges over Values.
Definition ValueRange.h:387

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition Value.h:96

Linalg.h

SCF.h

mlir::affine
Definition AffineToStandard.h:23

mlir::linalg
Definition LinalgToStandard.h:24

mlir::linalg::fuseProducerOfTensor
FailureOr< FusionInfo > fuseProducerOfTensor(OpBuilder &b, OpOperand &consumerOpOperand)
This implements the fusion part of the "tileAndFuse on tensors" transformation and thus requires the ...
Definition Fusion.cpp:218

mlir::linalg::getUnPackInverseSrcPerm
SmallVector< int64_t > getUnPackInverseSrcPerm(linalg::UnPackOp, PackingMetadata &metadata)
Compute inverse permutation for the source tensor (i.e.

mlir::linalg::makeTiledShapes
SmallVector< Value > makeTiledShapes(OpBuilder &builder, Location loc, LinalgOp linalgOp, ValueRange valuesToTile, ArrayRef< OpFoldResult > ivs, ArrayRef< OpFoldResult > tileSizes, ArrayRef< OpFoldResult > sizeBounds, bool omitPartialTileCheck)
Creates extract_slice/subview ops for all valuesToTile of the given linalgOp with builder,...
Definition Utils.cpp:2850

mlir::linalg::allIndexingsAreProjectedPermutation
bool allIndexingsAreProjectedPermutation(LinalgOp op)
Check if all indexing maps are projected permutations.
Definition Utils.cpp:197

mlir::linalg::isParallelIterator
bool isParallelIterator(utils::IteratorType iteratorType)
Check if iterator type has "parallel" semantics.
Definition Utils.cpp:232

mlir::linalg::computeTileSizes
SmallVector< OpFoldResult > computeTileSizes(OpBuilder &b, Location loc, ArrayRef< OpFoldResult > tileSizes, ArrayRef< OpFoldResult > sizeBounds)
Computes tile sizes, given a list of tileSizes and dimension sizes (sizeBounds).
Definition Utils.cpp:2745

mlir::linalg::matchConvolutionOpOfType
std::optional< DilationsAndStrides > matchConvolutionOpOfType(LinalgOp op)
Given a linalg op this function returns DilationsAndStrides if it is a convolution op of type ConvOpT...

mlir::linalg::makeMemRefCopyOp
GenericOp makeMemRefCopyOp(OpBuilder &b, Location loc, Value from, Value to)
Returns GenericOp that copies an n-D memref.
Definition Utils.cpp:2301

mlir::linalg::computeTileOffsets
SmallVector< OpFoldResult > computeTileOffsets(OpBuilder &b, Location loc, ArrayRef< OpFoldResult > ivs, ArrayRef< OpFoldResult > tileSizes)
Computes tile offsets, given a list of loop ivs and tileSizes.
Definition Utils.cpp:2731

mlir::linalg::LinalgTilingLoopType
LinalgTilingLoopType
The type of loops to be generated during tiling.
Definition Utils.h:135

mlir::linalg::LinalgTilingLoopType::Loops
@ Loops
Definition Utils.h:136

mlir::linalg::LinalgTilingLoopType::AffineLoops
@ AffineLoops
Definition Utils.h:137

mlir::linalg::LinalgTilingLoopType::ParallelLoops
@ ParallelLoops
Definition Utils.h:138

mlir::linalg::isReductionIterator
bool isReductionIterator(utils::IteratorType iteratorType)
Check if iterator type has "reduction" semantics.
Definition Utils.cpp:236

mlir::linalg::hasOnlyScalarElementwiseOp
bool hasOnlyScalarElementwiseOp(Region &r)
Detect whether r has only ConstantOp, ElementwiseMappable and YieldOp.
Definition Utils.cpp:203

mlir::linalg::getReassociationMapForFoldingUnitDims
std::optional< SmallVector< ReassociationIndices > > getReassociationMapForFoldingUnitDims(ArrayRef< OpFoldResult > mixedSizes)
Get the reassociation maps to fold the result of a extract_slice (or source of a insert_slice) operat...
Definition Utils.cpp:2908

mlir::linalg::DistributionMethod
DistributionMethod
Scheme used to distribute loops to processors.
Definition Utils.h:276

mlir::linalg::DistributionMethod::None
@ None
No Distribution.
Definition Utils.h:321

mlir::linalg::DistributionMethod::CyclicNumProcsGeNumIters
@ CyclicNumProcsGeNumIters
Cyclic distribution where the number of processors can be assumed to be more than or equal to the num...
Definition Utils.h:306

mlir::linalg::DistributionMethod::Cyclic
@ Cyclic
Cyclic distribution where no assumption is made about the dynamic relationship between number of proc...
Definition Utils.h:288

mlir::linalg::DistributionMethod::CyclicNumProcsEqNumIters
@ CyclicNumProcsEqNumIters
Cyclic distribution where the number of processors can be assumed to be equal to the number of iterat...
Definition Utils.h:318

mlir::linalg::insertSlicesBack
SmallVector< Value > insertSlicesBack(OpBuilder &builder, Location loc, LinalgOp op, ValueRange operands, ValueRange results)
Creates insert_slice ops that insert results back into larger tensors they were originally extracted ...
Definition Utils.cpp:2770

mlir::linalg::isElementwise
bool isElementwise(LinalgOp op)
Check if a LinalgOp is an element-wise operation.
Definition Utils.cpp:217

mlir::linalg::offsetIndices
void offsetIndices(OpBuilder &b, LinalgOp linalgOp, ArrayRef< OpFoldResult > offests)
Add the specified offsets to any linalg.index ops contained in the given linalgOp.
Definition Utils.cpp:2872

mlir::linalg::getPackInverseDestPerm
SmallVector< int64_t > getPackInverseDestPerm(linalg::PackOp packOp, PackingMetadata &metadata)
Compute inverse permutation for the destination tensor (i.e.

mlir::linalg::isaConvolutionOpOfType
bool isaConvolutionOpOfType(LinalgOp op)
Returns true if the linalg op is a convolution op of type ConvOpTy.
Definition Utils.h:126

mlir::linalg::computeAllSliceParameters
SmallVector< std::optional< SliceParameters > > computeAllSliceParameters(OpBuilder &builder, Location loc, LinalgOp linalgOp, ValueRange valuesToTile, ArrayRef< OpFoldResult > ivs, ArrayRef< OpFoldResult > tileSizes, ArrayRef< OpFoldResult > sizeBounds, bool omitPartialTileCheck)
Computes SliceParameters for all valuesToTile of the given linalgOp, assuming linalgOp is being fused...
Definition Utils.cpp:2799

mlir::linalg::makeTiledShape
Operation * makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile, ArrayRef< OpFoldResult > tileSizes, AffineMap map, ArrayRef< OpFoldResult > lbs, ArrayRef< OpFoldResult > ubs, ArrayRef< OpFoldResult > subShapeSizes, bool omitPartialTileCheck)
Creates an extract_slice/subview op for a single valueToTile with builder.
Definition Utils.cpp:2601

mlir::linalg::ProcInfoCallBackFn
std::function< SmallVector< ProcInfo >( OpBuilder &b, Location loc, ArrayRef< Range > parallelLoopRanges)> ProcInfoCallBackFn
Definition Utils.h:331

mlir::linalg::makeComposedPadHighOp
Value makeComposedPadHighOp(OpBuilder &b, Location loc, RankedTensorType type, Value source, Value padding, bool nofold, ValueRange typeDynDims={})
Create a tensor::PadOp that pads source to the shape of type whose sizes are assumed to be greater th...
Definition Utils.cpp:2233

mlir::linalg::updateBoundsForCyclicDistribution
void updateBoundsForCyclicDistribution(OpBuilder &builder, Location loc, Value procId, Value nprocs, Value &lb, Value &ub, Value &step)
Update the lb, ub and step to get per processor lb, ub and step.
Definition Utils.cpp:2400

mlir::linalg::getPrunedAttributeList
SmallVector< NamedAttribute > getPrunedAttributeList(OpTy op)
Returns an attribute list that excludes pre-defined attributes.
Definition Utils.h:402

mlir::linalg::getTensorOutputTypes
SmallVector< Type > getTensorOutputTypes(LinalgOp op, ValueRange operands)
Returns the list of tensor output types produced when the given structured operation op is applied to...
Definition Utils.cpp:2761

mlir::linalg::computeSliceParameters
SliceParameters computeSliceParameters(OpBuilder &builder, Location loc, Value valueToTile, ArrayRef< OpFoldResult > tileSizes, AffineMap map, ArrayRef< OpFoldResult > lbs, ArrayRef< OpFoldResult > ubs, ArrayRef< OpFoldResult > subShapeSizes, bool omitPartialTileCheck)
Computes SliceParameters for a single valueToTile assuming that its user is being tiled with the give...
Definition Utils.cpp:2614

mlir::scf::ValueVector
SmallVector< Value > ValueVector
An owning vector of values, handy to return from functions.
Definition SCF.h:64

mlir::tensor
Definition BufferizationTransformOps.h:19

mlir::ub
Definition UBToLLVM.h:24

mlir
Include the generated interface declarations.
Definition AliasAnalysis.h:19

mlir::function_ref
llvm::function_ref< Fn > function_ref
Definition LLVM.h:144

mlir::linalg::DilationsAndStrides
A struct containing dilations and strides inferred from convolution ops.
Definition Utils.h:110

mlir::linalg::DilationsAndStrides::strides
SmallVector< int64_t > strides
Definition Utils.h:112

mlir::linalg::DilationsAndStrides::dilations
SmallVector< int64_t > dilations
Definition Utils.h:111

mlir::linalg::FusionInfo
A struct containing the Linalg producer before and after fusion.
Definition Utils.h:250

mlir::linalg::FusionInfo::originalProducer
LinalgOp originalProducer
Definition Utils.h:251

mlir::linalg::FusionInfo::fusedProducer
LinalgOp fusedProducer
Definition Utils.h:252

mlir::linalg::GenerateLoopNest
Utility class used to generate nested loops with ranges described by loopRanges and loop type describ...
Definition Utils.h:390

mlir::linalg::GenerateLoopNest::doit
static void doit(OpBuilder &b, Location loc, ArrayRef< Range > loopRanges, LinalgOp linalgOp, ArrayRef< utils::IteratorType > iteratorTypes, function_ref< scf::ValueVector(OpBuilder &, Location, ValueRange, ValueRange)> bodyBuilderFn, ArrayRef< linalg::ProcInfo > procInfo={})

mlir::linalg::LinalgLoopDistributionOptions
Options that allow distribution of loops generated in Linalg transforms to processors while generatin...
Definition Utils.h:336

mlir::linalg::LinalgLoopDistributionOptions::procInfo
ProcInfoCallBackFn procInfo
Callback function that returns the Values for processor ID (procId), and number of processors (nprocs...
Definition Utils.h:343

mlir::linalg::ProcInfo
Callback function type used to get processor ID, and number of processors used for distribution for a...
Definition Utils.h:326

mlir::linalg::ProcInfo::distributionMethod
DistributionMethod distributionMethod
Definition Utils.h:329

mlir::linalg::ProcInfo::nprocs
Value nprocs
Definition Utils.h:328

mlir::linalg::ProcInfo::procId
Value procId
Definition Utils.h:327

mlir::linalg::RegionMatcher
A struct containing common matchers over linalg op's region.
Definition Utils.h:361

mlir::linalg::RegionMatcher::matchAsScalarBinaryOp
static std::optional< BinaryOpKind > matchAsScalarBinaryOp(GenericOp op)
Matches the given linalg op if its body is performing binary operation on int or float scalar values ...
Definition Utils.cpp:95

mlir::linalg::RegionMatcher::BinaryOpKind
BinaryOpKind
Definition Utils.h:362

mlir::linalg::RegionMatcher::BinaryOpKind::IAdd
@ IAdd
Definition Utils.h:363

mlir::linalg::SliceParameters
A struct containing offsets-sizes-strides arguments of the tiled shape.
Definition Utils.h:172

mlir::linalg::SliceParameters::strides
SmallVector< OpFoldResult > strides
Definition Utils.h:175

mlir::linalg::SliceParameters::sizes
SmallVector< OpFoldResult > sizes
Definition Utils.h:174

mlir::linalg::SliceParameters::offsets
SmallVector< OpFoldResult > offsets
Definition Utils.h:173