28 namespace bufferization {
29 #define GEN_PASS_DEF_FINALIZINGBUFFERIZE
30 #define GEN_PASS_DEF_BUFFERIZATIONBUFFERIZE
31 #define GEN_PASS_DEF_ONESHOTBUFFERIZE
32 #include "mlir/Dialect/Bufferization/Transforms/Passes.h.inc"
36 #define DEBUG_TYPE "bufferize"
47 assert(inputs.size() == 1);
48 assert(isa<BaseMemRefType>(inputs[0].
getType()));
49 return builder.
create<bufferization::ToTensorOp>(loc, type, inputs[0]);
68 assert(inputs.size() == 1 &&
"expected exactly one input");
70 if (
auto inputType = dyn_cast<MemRefType>(inputs[0].
getType())) {
72 assert(inputType != type &&
"expected different types");
74 auto rankedDestType = dyn_cast<MemRefType>(type);
79 FailureOr<Value> replacement =
81 if (failed(replacement))
86 if (isa<TensorType>(inputs[0].
getType())) {
88 return builder.
create<bufferization::ToMemrefOp>(loc, type, inputs[0]);
91 llvm_unreachable(
"only tensor/memref input types supported");
97 target.
addLegalOp<bufferization::ToTensorOp, bufferization::ToMemrefOp>();
103 class BufferizeToTensorOp
108 matchAndRewrite(bufferization::ToTensorOp op, OpAdaptor adaptor,
110 rewriter.
replaceOp(op, adaptor.getMemref());
119 class BufferizeToMemrefOp
124 matchAndRewrite(bufferization::ToMemrefOp op, OpAdaptor adaptor,
126 rewriter.
replaceOp(op, adaptor.getTensor());
134 patterns.
add<BufferizeToTensorOp, BufferizeToMemrefOp>(typeConverter,
139 struct FinalizingBufferizePass
140 :
public bufferization::impl::FinalizingBufferizeBase<
141 FinalizingBufferizePass> {
142 using FinalizingBufferizeBase<
143 FinalizingBufferizePass>::FinalizingBufferizeBase;
145 void runOnOperation()
override {
146 auto func = getOperation();
163 target.markUnknownOpDynamicallyLegal(
171 static LayoutMapOption parseLayoutMapOption(
const std::string &s) {
172 if (s ==
"fully-dynamic-layout-map")
173 return LayoutMapOption::FullyDynamicLayoutMap;
174 if (s ==
"identity-layout-map")
175 return LayoutMapOption::IdentityLayoutMap;
176 if (s ==
"infer-layout-map")
177 return LayoutMapOption::InferLayoutMap;
178 llvm_unreachable(
"invalid layout map option");
182 parseHeuristicOption(
const std::string &s) {
183 if (s ==
"bottom-up")
187 if (s ==
"bottom-up-from-terminators")
192 llvm_unreachable(
"invalid analysisheuristic option");
195 struct OneShotBufferizePass
196 :
public bufferization::impl::OneShotBufferizeBase<OneShotBufferizePass> {
197 OneShotBufferizePass() =
default;
204 .
insert<bufferization::BufferizationDialect, memref::MemRefDialect>();
207 void runOnOperation()
override {
219 parseLayoutMapOption(functionBoundaryTypeConversion));
220 if (mustInferMemorySpace) {
222 [](
TensorType t) -> std::optional<Attribute> {
234 LayoutMapOption unknownTypeConversionOption =
235 parseLayoutMapOption(unknownTypeConversion);
236 if (unknownTypeConversionOption == LayoutMapOption::InferLayoutMap) {
238 "Invalid option: 'infer-layout-map' is not a valid value for "
239 "'unknown-type-conversion'");
240 return signalPassFailure();
244 auto tensorType = cast<TensorType>(value.
getType());
245 if (unknownTypeConversionOption == LayoutMapOption::IdentityLayoutMap)
247 tensorType, memorySpace);
248 assert(unknownTypeConversionOption ==
249 LayoutMapOption::FullyDynamicLayoutMap &&
250 "invalid layout map option");
258 if (this->dialectFilter.hasValue())
259 return llvm::is_contained(this->dialectFilter,
275 "Invalid option: 'copy-before-write' cannot be used with "
276 "'test-analysis-only'");
277 return signalPassFailure();
283 "Invalid option: 'print-conflicts' requires 'test-analysis-only'");
284 return signalPassFailure();
290 "Invalid option: 'dump-alias-sets' requires 'test-analysis-only'");
291 return signalPassFailure();
295 ModuleOp moduleOp = getOperation();
304 "Invalid option: 'no-analysis-func-filter' requires "
305 "'bufferize-function-boundaries'");
306 return signalPassFailure();
321 std::optional<OneShotBufferizationOptions>
options;
326 return std::make_unique<OneShotBufferizePass>();
331 return std::make_unique<OneShotBufferizePass>(
options);
334 std::unique_ptr<OperationPass<func::FuncOp>>
336 return std::make_unique<FinalizingBufferizePass>();
352 :
IRRewriter(ctx), erasedOps(erasedOps), toMemrefOps(toMemrefOps),
353 worklist(worklist), analysisState(
options), statistics(statistics) {
358 void notifyOperationErased(
Operation *op)
override {
359 erasedOps.insert(op);
361 toMemrefOps.erase(op);
364 void notifyOperationInserted(
Operation *op, InsertPoint previous)
override {
366 if (previous.isSet())
373 if (
auto sideEffectingOp = dyn_cast<MemoryEffectOpInterface>(op))
379 if (isa<ToMemrefOp>(op)) {
380 toMemrefOps.insert(op);
385 if (isa<ToTensorOp>(op))
393 auto const &
options = analysisState.getOptions();
398 worklist.push_back(op);
431 op->
walk([&](ToMemrefOp toMemrefOp) { toMemrefOps.insert(toMemrefOp); });
443 worklist.push_back(op);
450 BufferizationRewriter rewriter(op->
getContext(), erasedOps, toMemrefOps,
451 worklist,
options, statistics);
452 for (
unsigned i = 0; i < worklist.size(); ++i) {
455 if (erasedOps.contains(nextOp))
458 auto bufferizableOp =
options.dynCastBufferizableOp(nextOp);
465 if (!bufferizableOp.supportsUnstructuredControlFlow())
467 if (r.getBlocks().size() > 1)
469 "op or BufferizableOpInterface implementation does not support "
470 "unstructured control flow, but at least one region has multiple "
474 LLVM_DEBUG(llvm::dbgs()
475 <<
"//===-------------------------------------------===//\n"
476 <<
"IR after bufferizing: " << nextOp->
getName() <<
"\n");
477 rewriter.setInsertionPoint(nextOp);
478 if (failed(bufferizableOp.bufferize(rewriter,
options))) {
479 LLVM_DEBUG(llvm::dbgs()
480 <<
"failed to bufferize\n"
481 <<
"//===-------------------------------------------===//\n");
482 return nextOp->
emitError(
"failed to bufferize op");
484 LLVM_DEBUG(llvm::dbgs()
486 <<
"\n//===-------------------------------------------===//\n");
490 if (erasedOps.contains(op))
495 rewriter.setInsertionPoint(op);
497 rewriter, cast<ToMemrefOp>(op),
options);
502 if (toTensorOp->getUses().empty()) {
503 rewriter.eraseOp(toTensorOp);
516 if (erasedOps.contains(op))
529 if (isa<ToTensorOp, ToMemrefOp>(op))
531 return op->
emitError(
"op was not bufferized");
548 auto tensorType = dyn_cast<TensorType>(bbArg.getType());
550 newTypes.push_back(bbArg.getType());
554 FailureOr<BaseMemRefType> memrefType =
556 if (failed(memrefType))
558 newTypes.push_back(*memrefType);
562 for (
auto [bbArg, type] : llvm::zip(block->
getArguments(), newTypes)) {
563 if (bbArg.getType() == type)
569 bbArgUses.push_back(&use);
576 if (!bbArgUses.empty()) {
578 rewriter.
create<bufferization::ToTensorOp>(bbArg.getLoc(), bbArg);
580 use->set(toTensorOp);
586 auto branchOp = dyn_cast<BranchOpInterface>(op);
588 return op->
emitOpError(
"cannot bufferize ops with block references that "
589 "do not implement BranchOpInterface");
592 assert(it != op->
getSuccessors().end() &&
"could find successor");
593 int64_t successorIdx = std::distance(op->
getSuccessors().begin(), it);
597 for (
auto [operand, type] :
599 if (operand.getType() == type) {
601 newOperands.push_back(operand);
604 FailureOr<BaseMemRefType> operandBufferType =
606 if (failed(operandBufferType))
609 Value bufferizedOperand = rewriter.
create<bufferization::ToMemrefOp>(
610 operand.getLoc(), *operandBufferType, operand);
613 if (type != *operandBufferType)
614 bufferizedOperand = rewriter.
create<memref::CastOp>(
615 operand.getLoc(), type, bufferizedOperand);
616 newOperands.push_back(bufferizedOperand);
626 options.allowUnknownOps =
true;
627 options.copyBeforeWrite =
true;
628 options.enforceAliasingInvariants =
false;
632 cast<TensorType>(value.
getType()), memorySpace);
634 options.opFilter.allowDialect<BufferizationDialect>();
static Value materializeToTensor(OpBuilder &builder, TensorType type, ValueRange inputs, Location loc)
static MLIRContext * getContext(OpFoldResult val)
static llvm::ManagedStatic< PassManagerOptions > options
Base class for generic analysis states.
Attributes are known-constant values of operations.
This class provides a shared interface for ranked and unranked memref types.
This class represents an argument of a Block.
Block represents an ordered list of Operations.
BlockArgListType getArguments()
Operation * getParentOp()
Returns the closest surrounding operation that contains this block.
This class implements a pattern rewriter for use with ConversionPatterns.
void replaceOp(Operation *op, ValueRange newValues) override
Replace the given operation with the new values.
This class describes a specific conversion target.
void addLegalOp(OperationName op)
Register the given operations as legal.
The DialectRegistry maps a dialect namespace to a constructor for the matching dialect.
StringRef getNamespace() const
user_range getUsers() const
Returns a range of all users.
This class coordinates rewriting a piece of IR outside of a pattern rewrite, providing a way to keep track of the mutations made to the IR.
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around a LocationAttr.
MLIRContext is the top-level object for a collection of MLIR operations.
void assign(ValueRange values)
Assign this range to the given values.
RAII guard to reset the insertion point of the builder when destroyed.
This class helps build Operations.
void setInsertionPointToStart(Block *block)
Sets the insertion point to the start of the specified block.
void setInsertionPointAfterValue(Value val)
Sets the insertion point to the node after the specified value.
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
OpConversionPattern is a wrapper around ConversionPattern that allows for matching and rewriting against an instance of a derived operation class as opposed to a raw Operation.
OpConversionPattern(MLIRContext *context, PatternBenefit benefit=1)
This class represents an operand of an operation.
Operation is the basic unit of execution within MLIR.
Dialect * getDialect()
Return the dialect this operation is associated with, or nullptr if the associated dialect is not loaded.
std::enable_if_t< llvm::function_traits< std::decay_t< FnT > >::num_args==1, RetT > walk(FnT &&callback)
Walk the operation by calling the callback for each nested operation (including this one), block or region, depending on the callback provided.
MLIRContext * getContext()
Return the context this operation is associated with.
InFlightDiagnostic emitError(const Twine &message={})
Emit an error about fatal conditions with this operation, reporting up to any diagnostic handlers that may be listening.
MutableArrayRef< Region > getRegions()
Returns the regions held by this operation.
OperationName getName()
The name of an operation is the key identifier for it.
SuccessorRange getSuccessors()
use_range getUses()
Returns a range of all uses, which is useful for iterating over all uses.
InFlightDiagnostic emitOpError(const Twine &message={})
Emit an error with the op name prefixed, like "'dim' op " which is convenient for verifiers.
This class contains a list of basic blocks and a link to the parent operation it is attached to.
MLIRContext * getContext() const
RewritePatternSet & add(ConstructorArg &&arg, ConstructorArgs &&...args)
Add an instance of each of the pattern types 'Ts' to the pattern list with the given arguments.
This class coordinates the application of a rewrite on a set of IR, providing a way for clients to track mutations and create new operations.
This class models how operands are forwarded to block arguments in control flow.
MutableOperandRange getMutableForwardedOperands() const
Get the range of operands that are simply forwarded to the successor.
OperandRange getForwardedOperands() const
Get the range of operands that are simply forwarded to the successor.
Tensor types represent multi-dimensional arrays, and have two variants: RankedTensorType and UnrankedTensorType.
void addConversion(FnT &&callback)
Register a conversion function.
bool isLegal(Type type) const
Return true if the given type is legal for this type converter, i.e. the type converts to itself.
void addArgumentMaterialization(FnT &&callback)
All of the following materializations require function objects that are convertible to the following ...
void addSourceMaterialization(FnT &&callback)
This method registers a materialization that will be called when converting a legal replacement value...
void addTargetMaterialization(FnT &&callback)
This method registers a materialization that will be called when converting an illegal (source) value...
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable component.
This class provides an abstraction over the different types of ranges over Values.
This class represents an instance of an SSA value in the MLIR system, representing a computable value that has a type and a set of users.
Type getType() const
Return the type of this value.
static WalkResult advance()
AnalysisState provides a variety of helper functions for dealing with tensor values.
A helper type converter class that automatically populates the relevant materializations and type conversions for bufferization.
BufferizeTypeConverter()
Registers conversions into BufferizeTypeConverter.
void allowOperation()
Allow the given ops.
LogicalResult runOneShotBufferize(Operation *op, const OneShotBufferizationOptions &options, BufferizationStatistics *statistics=nullptr)
Run One-Shot Bufferize on the given op: Analysis + Bufferization.
BaseMemRefType getMemRefTypeWithStaticIdentityLayout(TensorType tensorType, Attribute memorySpace=nullptr)
Return a MemRef type with a static identity layout (i.e., no layout map).
FailureOr< Value > castOrReallocMemRefValue(OpBuilder &b, Value value, MemRefType type, const BufferizationOptions &options)
Try to cast the given ranked MemRef-typed value to the given ranked MemRef type.
llvm::LogicalResult runOneShotModuleBufferize(ModuleOp moduleOp, const bufferization::OneShotBufferizationOptions &options, BufferizationStatistics *statistics=nullptr)
Run One-Shot Module Bufferization on the given module.
void populateBufferizeMaterializationLegality(ConversionTarget &target)
Marks ops used by bufferization for type conversion materializations as "legal" in the given ConversionTarget.
LogicalResult bufferizeOp(Operation *op, const BufferizationOptions &options, BufferizationStatistics *statistics=nullptr)
Bufferize op and its nested ops that implement BufferizableOpInterface.
LogicalResult insertTensorCopies(Operation *op, const OneShotBufferizationOptions &options, BufferizationStatistics *statistics=nullptr)
Resolve RaW and other conflicts by inserting bufferization.alloc_tensor ops.
std::unique_ptr< OperationPass< func::FuncOp > > createFinalizingBufferizePass()
Creates a pass that finalizes a partial bufferization by removing remaining bufferization.to_tensor and bufferization.to_memref operations.
LogicalResult bufferizeBlockSignature(Block *block, RewriterBase &rewriter, const BufferizationOptions &options)
Bufferize the signature of block and its callers (i.e., ops that have the given block as a successor)...
std::unique_ptr< Pass > createOneShotBufferizePass()
Create a pass that bufferizes all ops that implement BufferizableOpInterface with One-Shot Bufferize.
LogicalResult foldToMemrefToTensorPair(RewriterBase &rewriter, ToMemrefOp toMemref, const BufferizationOptions &options)
Try to fold to_memref(to_tensor(x)).
FailureOr< BaseMemRefType > getBufferType(Value value, const BufferizationOptions &options)
Return the buffer type for a given Value (tensor) after bufferization without bufferizing any IR.
BufferizationOptions getPartialBufferizationOptions()
Return BufferizationOptions such that the bufferizeOp behaves like the old (deprecated) partial,...
void populateEliminateBufferizeMaterializationsPatterns(const BufferizeTypeConverter &typeConverter, RewritePatternSet &patterns)
Populate patterns to eliminate bufferize materializations.
BaseMemRefType getMemRefTypeWithFullyDynamicLayout(TensorType tensorType, Attribute memorySpace=nullptr)
Return a MemRef type with fully dynamic layout.
bool hasTensorSemantics(Operation *op)
Return "true" if the given op has tensor semantics and should be bufferized.
Include the generated interface declarations.
Type getType(OpFoldResult ofr)
Returns the int type of the integer in ofr.
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
LogicalResult applyFullConversion(ArrayRef< Operation * > ops, const ConversionTarget &target, const FrozenRewritePatternSet &patterns, ConversionConfig config=ConversionConfig())
Apply a complete conversion on the given operations, and all nested operations.
bool isMemoryEffectFree(Operation *op)
Returns true if the given operation is free of memory effects.
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
The following effect indicates that the operation allocates from some resource.
Options for BufferizableOpInterface-based bufferization.
bool copyBeforeWrite
If set to true, the analysis is skipped.
void setFunctionBoundaryTypeConversion(LayoutMapOption layoutMapOption)
This function controls buffer types on function signatures.
bool allowUnknownOps
Specifies whether not bufferizable ops are allowed in the input.
unsigned int bufferAlignment
Buffer alignment for new memory allocations.
bool printConflicts
If set to true, the IR is annotated with details about RaW conflicts.
bool testAnalysisOnly
If set to true, does not modify the IR apart from adding attributes (for checking the results of the ...
OpFilter opFilter
A filter that specifies which ops should be bufferized and which ops should be ignored.
bool checkParallelRegions
UnknownTypeConverterFn unknownTypeConverterFn
Type converter from tensors to memrefs.
bool bufferizeFunctionBoundaries
Specifies whether function boundaries (ops in the func dialect) should be bufferized or not.
DefaultMemorySpaceFn defaultMemorySpaceFn
Bufferization statistics for debugging.
int64_t numTensorOutOfPlace
Options for analysis-enabled bufferization.
unsigned analysisFuzzerSeed
Seed for the analysis fuzzer.
bool dumpAliasSets
Specifies whether the tensor IR should be annotated with alias sets.
bool allowReturnAllocsFromLoops
Specifies whether returning newly allocated memrefs from loops should be allowed.
AnalysisHeuristic analysisHeuristic
The heuristic controls the order in which ops are traversed during the analysis.
@ BottomUpFromTerminators
llvm::ArrayRef< std::string > noAnalysisFuncFilter
Specify the functions that should not be analyzed.
std::function< bool(Operation *)> FilterFn
If the filter function evaluates to true, the filter matches.