doxygen/BufferDeallocation_8cpp_source.html

 //===- BufferDeallocation.cpp - the impl for buffer deallocation ----------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This file implements logic for computing correct alloc and dealloc positions.

 // Furthermore, buffer deallocation also adds required new clone operations to

 // ensure that all buffers are deallocated. The main class is the

 // BufferDeallocationPass class that implements the underlying algorithm. In

 // order to put allocations and deallocations at safe positions, it is

 // significantly important to put them into the correct blocks. However, the

 // liveness analysis does not pay attention to aliases, which can occur due to

 // branches (and their associated block arguments) in general. For this purpose,

 // BufferDeallocation firstly finds all possible aliases for a single value

 // (using the BufferViewFlowAnalysis class). Consider the following example:

 //

 // ^bb0(%arg0):

 //   cf.cond_br %cond, ^bb1, ^bb2

 // ^bb1:

 //   cf.br ^exit(%arg0)

 // ^bb2:

 //   %new_value = ...

 //   cf.br ^exit(%new_value)

 // ^exit(%arg1):

 //   return %arg1;

 //

 // We should place the dealloc for %new_value in exit. However, we have to free

 // the buffer in the same block, because it cannot be freed in the post

 // dominator. However, this requires a new clone buffer for %arg1 that will

 // contain the actual contents. Using the class BufferViewFlowAnalysis, we

 // will find out that %new_value has a potential alias %arg1. In order to find

 // the dealloc position we have to find all potential aliases, iterate over

 // their uses and find the common post-dominator block (note that additional

 // clones and buffers remove potential aliases and will influence the placement

 // of the deallocs). In all cases, the computed block can be safely used to free

 // the %new_value buffer (may be exit or bb2) as it will die and we can use

 // liveness information to determine the exact operation after which we have to

 // insert the dealloc. However, the algorithm supports introducing clone buffers

 // and placing deallocs in safe locations to ensure that all buffers will be

 // freed in the end.

 //

 // TODO:

 // The current implementation does not support explicit-control-flow loops and

 // the resulting code will be invalid with respect to program semantics.

 // However, structured control-flow loops are fully supported. Furthermore, it

 // doesn't accept functions which return buffers already.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/Bufferization/Transforms/Passes.h"


 #include "mlir/Dialect/Bufferization/IR/AllocationOpInterface.h"

 #include "mlir/Dialect/Bufferization/IR/Bufferization.h"

 #include "mlir/Dialect/Bufferization/Transforms/BufferUtils.h"

 #include "mlir/Dialect/Func/IR/FuncOps.h"

 #include "mlir/Dialect/MemRef/IR/MemRef.h"

 #include "llvm/ADT/SetOperations.h"


 namespace mlir {

 namespace bufferization {

 #define GEN_PASS_DEF_BUFFERDEALLOCATION

 #include "mlir/Dialect/Bufferization/Transforms/Passes.h.inc"

 } // namespace bufferization

 } // namespace mlir


 using namespace mlir;

 using namespace mlir::bufferization;


 /// Walks over all immediate return-like terminators in the given region.

 static LogicalResult walkReturnOperations(

     Region *region,

     llvm::function_ref<LogicalResult(RegionBranchTerminatorOpInterface)> func) {

   for (Block &block : *region) {

     Operation *terminator = block.getTerminator();

     // Skip non region-return-like terminators.

     if (auto regionTerminator =

             dyn_cast<RegionBranchTerminatorOpInterface>(terminator)) {

       if (failed(func(regionTerminator)))

         return failure();

     }

   }

   return success();

 }


 /// Checks if all operations that have at least one attached region implement

 /// the RegionBranchOpInterface. This is not required in edge cases, where we

 /// have a single attached region and the parent operation has no results.

 static bool validateSupportedControlFlow(Operation *op) {

   WalkResult result = op->walk([&](Operation *operation) {

     // Only check ops that are inside a function.

     if (!operation->getParentOfType<func::FuncOp>())

       return WalkResult::advance();


     auto regions = operation->getRegions();

     // Walk over all operations in a region and check if the operation has at

     // least one region and implements the RegionBranchOpInterface. If there

     // is an operation that does not fulfill this condition, we cannot apply

     // the deallocation steps. Furthermore, we accept cases, where we have a

     // region that returns no results, since, in that case, the intra-region

     // control flow does not affect the transformation.

     size_t size = regions.size();

     if (((size == 1 && !operation->getResults().empty()) || size > 1) &&

         !dyn_cast<RegionBranchOpInterface>(operation)) {

       operation->emitError("All operations with attached regions need to "

                            "implement the RegionBranchOpInterface.");

     }


     return WalkResult::advance();

   });

   return !result.wasSkipped();

 }


 namespace {


 //===----------------------------------------------------------------------===//

 // Backedges analysis

 //===----------------------------------------------------------------------===//


 /// A straight-forward program analysis which detects loop backedges induced by

 /// explicit control flow.

 class Backedges {

 public:

   using BlockSetT = SmallPtrSet<Block *, 16>;

   using BackedgeSetT = llvm::DenseSet<std::pair<Block *, Block *>>;


 public:

   /// Constructs a new backedges analysis using the op provided.

   Backedges(Operation *op) { recurse(op); }


   /// Returns the number of backedges formed by explicit control flow.

   size_t size() const { return edgeSet.size(); }


   /// Returns the start iterator to loop over all backedges.

   BackedgeSetT::const_iterator begin() const { return edgeSet.begin(); }


   /// Returns the end iterator to loop over all backedges.

   BackedgeSetT::const_iterator end() const { return edgeSet.end(); }


 private:

   /// Enters the current block and inserts a backedge into the `edgeSet` if we

   /// have already visited the current block. The inserted edge links the given

   /// `predecessor` with the `current` block.

   bool enter(Block &current, Block *predecessor) {

     bool inserted = visited.insert(&current).second;

     if (!inserted)

       edgeSet.insert(std::make_pair(predecessor, &current));

     return inserted;

   }


   /// Leaves the current block.

   void exit(Block &current) { visited.erase(&current); }


   /// Recurses into the given operation while taking all attached regions into

   /// account.

   void recurse(Operation *op) {

     Block *current = op->getBlock();

     // If the current op implements the `BranchOpInterface`, there can be

     // cycles in the scope of all successor blocks.

     if (isa<BranchOpInterface>(op)) {

       for (Block *succ : current->getSuccessors())

         recurse(*succ, current);

     }

     // Recurse into all distinct regions and check for explicit control-flow

     // loops.

     for (Region &region : op->getRegions()) {

       if (!region.empty())

         recurse(region.front(), current);

     }

   }


   /// Recurses into explicit control-flow structures that are given by

   /// the successor relation defined on the block level.

   void recurse(Block &block, Block *predecessor) {

     // Try to enter the current block. If this is not possible, we are

     // currently processing this block and can safely return here.

     if (!enter(block, predecessor))

       return;


     // Recurse into all operations and successor blocks.

     for (Operation &op : block.getOperations())

       recurse(&op);


     // Leave the current block.

     exit(block);

   }


   /// Stores all blocks that are currently visited and on the processing stack.

   BlockSetT visited;


   /// Stores all backedges in the format (source, target).

   BackedgeSetT edgeSet;

 };


 //===----------------------------------------------------------------------===//

 // BufferDeallocation

 //===----------------------------------------------------------------------===//


 /// The buffer deallocation transformation which ensures that all allocs in the

 /// program have a corresponding de-allocation. As a side-effect, it might also

 /// introduce clones that in turn leads to additional deallocations.

 class BufferDeallocation : public BufferPlacementTransformationBase {

 public:

   using AliasAllocationMapT =

       llvm::DenseMap<Value, bufferization::AllocationOpInterface>;


   BufferDeallocation(Operation *op)

       : BufferPlacementTransformationBase(op), dominators(op),

         postDominators(op) {}


   /// Checks if all allocation operations either provide an already existing

   /// deallocation operation or implement the AllocationOpInterface. In

   /// addition, this method initializes the internal alias to

   /// AllocationOpInterface mapping in order to get compatible

   /// AllocationOpInterface implementations for aliases.

   LogicalResult prepare() {

     for (const BufferPlacementAllocs::AllocEntry &entry : allocs) {

       // Get the defining allocation operation.

       Value alloc = std::get<0>(entry);

       auto allocationInterface =

           alloc.getDefiningOp<bufferization::AllocationOpInterface>();

       // If there is no existing deallocation operation and no implementation of

       // the AllocationOpInterface, we cannot apply the BufferDeallocation pass.

       if (!std::get<1>(entry) && !allocationInterface) {

         return alloc.getDefiningOp()->emitError(

             "Allocation is not deallocated explicitly nor does the operation "

             "implement the AllocationOpInterface.");

       }


       // Register the current allocation interface implementation.

       aliasToAllocations[alloc] = allocationInterface;


       // Get the alias information for the current allocation node.

       for (Value alias : aliases.resolve(alloc)) {

         // TODO: check for incompatible implementations of the

         // AllocationOpInterface. This could be realized by promoting the

         // AllocationOpInterface to a DialectInterface.

         aliasToAllocations[alias] = allocationInterface;

       }

     }

     return success();

   }


   /// Performs the actual placement/creation of all temporary clone and dealloc

   /// nodes.

   LogicalResult deallocate() {

     // Add additional clones that are required.

     if (failed(introduceClones()))

       return failure();


     // Place deallocations for all allocation entries.

     return placeDeallocs();

   }


 private:

   /// Introduces required clone operations to avoid memory leaks.

   LogicalResult introduceClones() {

     // Initialize the set of values that require a dedicated memory free

     // operation since their operands cannot be safely deallocated in a post

     // dominator.

     SetVector<Value> valuesToFree;

     llvm::SmallDenseSet<std::tuple<Value, Block *>> visitedValues;

     SmallVector<std::tuple<Value, Block *>, 8> toProcess;


     // Check dominance relation for proper dominance properties. If the given

     // value node does not dominate an alias, we will have to create a clone in

     // order to free all buffers that can potentially leak into a post

     // dominator.

     auto findUnsafeValues = [&](Value source, Block *definingBlock) {

       auto it = aliases.find(source);

       if (it == aliases.end())

         return;

       for (Value value : it->second) {

         if (valuesToFree.count(value) > 0)

           continue;

         Block *parentBlock = value.getParentBlock();

         // Check whether we have to free this particular block argument or

         // generic value. We have to free the current alias if it is either

         // defined in a non-dominated block or it is defined in the same block

         // but the current value is not dominated by the source value.

         if (!dominators.dominates(definingBlock, parentBlock) ||

             (definingBlock == parentBlock && isa<BlockArgument>(value))) {

           toProcess.emplace_back(value, parentBlock);

           valuesToFree.insert(value);

         } else if (visitedValues.insert(std::make_tuple(value, definingBlock))

                        .second)

           toProcess.emplace_back(value, definingBlock);

       }

     };


     // Detect possibly unsafe aliases starting from all allocations.

     for (BufferPlacementAllocs::AllocEntry &entry : allocs) {

       Value allocValue = std::get<0>(entry);

       findUnsafeValues(allocValue, allocValue.getDefiningOp()->getBlock());

     }

     // Try to find block arguments that require an explicit free operation

     // until we reach a fix point.

     while (!toProcess.empty()) {

       auto current = toProcess.pop_back_val();

       findUnsafeValues(std::get<0>(current), std::get<1>(current));

     }


     // Update buffer aliases to ensure that we free all buffers and block

     // arguments at the correct locations.

     aliases.remove(valuesToFree);


     // Add new allocs and additional clone operations.

     for (Value value : valuesToFree) {

       if (failed(isa<BlockArgument>(value)

                      ? introduceBlockArgCopy(cast<BlockArgument>(value))

                      : introduceValueCopyForRegionResult(value)))

         return failure();


       // Register the value to require a final dealloc. Note that we do not have

       // to assign a block here since we do not want to move the allocation node

       // to another location.

       allocs.registerAlloc(std::make_tuple(value, nullptr));

     }

     return success();

   }


   /// Introduces temporary clones in all predecessors and copies the source

   /// values into the newly allocated buffers.

   LogicalResult introduceBlockArgCopy(BlockArgument blockArg) {

     // Allocate a buffer for the current block argument in the block of

     // the associated value (which will be a predecessor block by

     // definition).

     Block *block = blockArg.getOwner();

     for (auto it = block->pred_begin(), e = block->pred_end(); it != e; ++it) {

       // Get the terminator and the value that will be passed to our

       // argument.

       Operation *terminator = (*it)->getTerminator();

       auto branchInterface = cast<BranchOpInterface>(terminator);

       SuccessorOperands operands =

           branchInterface.getSuccessorOperands(it.getSuccessorIndex());


       // Query the associated source value.

       Value sourceValue = operands[blockArg.getArgNumber()];

       if (!sourceValue) {

         return failure();

       }

       // Wire new clone and successor operand.

       // Create a new clone at the current location of the terminator.

       auto clone = introduceCloneBuffers(sourceValue, terminator);

       if (failed(clone))

         return failure();

       operands.slice(blockArg.getArgNumber(), 1).assign(*clone);

     }


     // Check whether the block argument has implicitly defined predecessors via

     // the RegionBranchOpInterface. This can be the case if the current block

     // argument belongs to the first block in a region and the parent operation

     // implements the RegionBranchOpInterface.

     Region *argRegion = block->getParent();

     Operation *parentOp = argRegion->getParentOp();

     RegionBranchOpInterface regionInterface;

     if (&argRegion->front() != block ||

         !(regionInterface = dyn_cast<RegionBranchOpInterface>(parentOp)))

       return success();


     if (failed(introduceClonesForRegionSuccessors(

             regionInterface, argRegion->getParentOp()->getRegions(), blockArg,

             [&](RegionSuccessor &successorRegion) {

               // Find a predecessor of our argRegion.

               return successorRegion.getSuccessor() == argRegion;

             })))

       return failure();


     // Check whether the block argument belongs to an entry region of the

     // parent operation. In this case, we have to introduce an additional clone

     // for buffer that is passed to the argument.

     SmallVector<RegionSuccessor, 2> successorRegions;

     regionInterface.getSuccessorRegions(/*point=*/RegionBranchPoint::parent(),

                                         successorRegions);

     auto *it =

         llvm::find_if(successorRegions, [&](RegionSuccessor &successorRegion) {

           return successorRegion.getSuccessor() == argRegion;

         });

     if (it == successorRegions.end())

       return success();


     // Determine the actual operand to introduce a clone for and rewire the

     // operand to point to the clone instead.

     auto operands = regionInterface.getEntrySuccessorOperands(argRegion);

     size_t operandIndex =

         llvm::find(it->getSuccessorInputs(), blockArg).getIndex() +

         operands.getBeginOperandIndex();

     Value operand = parentOp->getOperand(operandIndex);

     assert(operand ==

                operands[operandIndex - operands.getBeginOperandIndex()] &&

            "region interface operands don't match parentOp operands");

     auto clone = introduceCloneBuffers(operand, parentOp);

     if (failed(clone))

       return failure();


     parentOp->setOperand(operandIndex, *clone);

     return success();

   }


   /// Introduces temporary clones in front of all associated nested-region

   /// terminators and copies the source values into the newly allocated buffers.

   LogicalResult introduceValueCopyForRegionResult(Value value) {

     // Get the actual result index in the scope of the parent terminator.

     Operation *operation = value.getDefiningOp();

     auto regionInterface = cast<RegionBranchOpInterface>(operation);

     // Filter successors that return to the parent operation.

     auto regionPredicate = [&](RegionSuccessor &successorRegion) {

       // If the RegionSuccessor has no associated successor, it will return to

       // its parent operation.

       return !successorRegion.getSuccessor();

     };

     // Introduce a clone for all region "results" that are returned to the

     // parent operation. This is required since the parent's result value has

     // been considered critical. Therefore, the algorithm assumes that a clone

     // of a previously allocated buffer is returned by the operation (like in

     // the case of a block argument).

     return introduceClonesForRegionSuccessors(

         regionInterface, operation->getRegions(), value, regionPredicate);

   }


   /// Introduces buffer clones for all terminators in the given regions. The

   /// regionPredicate is applied to every successor region in order to restrict

   /// the clones to specific regions.

   template <typename TPredicate>

   LogicalResult introduceClonesForRegionSuccessors(

       RegionBranchOpInterface regionInterface, MutableArrayRef<Region> regions,

       Value argValue, const TPredicate &regionPredicate) {

     for (Region &region : regions) {

       // Query the regionInterface to get all successor regions of the current

       // one.

       SmallVector<RegionSuccessor, 2> successorRegions;

       regionInterface.getSuccessorRegions(region, successorRegions);

       // Try to find a matching region successor.

       RegionSuccessor *regionSuccessor =

           llvm::find_if(successorRegions, regionPredicate);

       if (regionSuccessor == successorRegions.end())

         continue;

       // Get the operand index in the context of the current successor input

       // bindings.

       size_t operandIndex =

           llvm::find(regionSuccessor->getSuccessorInputs(), argValue)

               .getIndex();


       // Iterate over all immediate terminator operations to introduce

       // new buffer allocations. Thereby, the appropriate terminator operand

       // will be adjusted to point to the newly allocated buffer instead.

       if (failed(walkReturnOperations(

               &region, [&](RegionBranchTerminatorOpInterface terminator) {

                 // Get the actual mutable operands for this terminator op.

                 auto terminatorOperands =

                     terminator.getMutableSuccessorOperands(*regionSuccessor);

                 // Extract the source value from the current terminator.

                 // This conversion needs to exist on a separate line due to a

                 // bug in GCC conversion analysis.

                 OperandRange immutableTerminatorOperands = terminatorOperands;

                 Value sourceValue = immutableTerminatorOperands[operandIndex];

                 // Create a new clone at the current location of the terminator.

                 auto clone = introduceCloneBuffers(sourceValue, terminator);

                 if (failed(clone))

                   return failure();

                 // Wire clone and terminator operand.

                 terminatorOperands.slice(operandIndex, 1).assign(*clone);

                 return success();

               })))

         return failure();

     }

     return success();

   }


   /// Creates a new memory allocation for the given source value and clones

   /// its content into the newly allocated buffer. The terminator operation is

   /// used to insert the clone operation at the right place.

   FailureOr<Value> introduceCloneBuffers(Value sourceValue,

                                          Operation *terminator) {

     // Avoid multiple clones of the same source value. This can happen in the

     // presence of loops when a branch acts as a backedge while also having

     // another successor that returns to its parent operation. Note: that

     // copying copied buffers can introduce memory leaks since the invariant of

     // BufferDeallocation assumes that a buffer will be only cloned once into a

     // temporary buffer. Hence, the construction of clone chains introduces

     // additional allocations that are not tracked automatically by the

     // algorithm.

     if (clonedValues.contains(sourceValue))

       return sourceValue;

     // Create a new clone operation that copies the contents of the old

     // buffer to the new one.

     auto clone = buildClone(terminator, sourceValue);

     if (succeeded(clone)) {

       // Remember the clone of original source value.

       clonedValues.insert(*clone);

     }

     return clone;

   }


   /// Finds correct dealloc positions according to the algorithm described at

   /// the top of the file for all alloc nodes and block arguments that can be

   /// handled by this analysis.

   LogicalResult placeDeallocs() {

     // Move or insert deallocs using the previously computed information.

     // These deallocations will be linked to their associated allocation nodes

     // since they don't have any aliases that can (potentially) increase their

     // liveness.

     for (const BufferPlacementAllocs::AllocEntry &entry : allocs) {

       Value alloc = std::get<0>(entry);

       auto aliasesSet = aliases.resolve(alloc);

       assert(!aliasesSet.empty() && "must contain at least one alias");


       // Determine the actual block to place the dealloc and get liveness

       // information.

       Block *placementBlock =

           findCommonDominator(alloc, aliasesSet, postDominators);

       const LivenessBlockInfo *livenessInfo =

           liveness.getLiveness(placementBlock);


       // We have to ensure that the dealloc will be after the last use of all

       // aliases of the given value. We first assume that there are no uses in

       // the placementBlock and that we can safely place the dealloc at the

       // beginning.

       Operation *endOperation = &placementBlock->front();


       // Iterate over all aliases and ensure that the endOperation will point

       // to the last operation of all potential aliases in the placementBlock.

       for (Value alias : aliasesSet) {

         // Ensure that the start operation is at least the defining operation of

         // the current alias to avoid invalid placement of deallocs for aliases

         // without any uses.

         Operation *beforeOp = endOperation;

         if (alias.getDefiningOp() &&

             !(beforeOp = placementBlock->findAncestorOpInBlock(

                   *alias.getDefiningOp())))

           continue;


         Operation *aliasEndOperation =

             livenessInfo->getEndOperation(alias, beforeOp);

         // Check whether the aliasEndOperation lies in the desired block and

         // whether it is behind the current endOperation. If yes, this will be

         // the new endOperation.

         if (aliasEndOperation->getBlock() == placementBlock &&

             endOperation->isBeforeInBlock(aliasEndOperation))

           endOperation = aliasEndOperation;

       }

       // endOperation is the last operation behind which we can safely store

       // the dealloc taking all potential aliases into account.


       // If there is an existing dealloc, move it to the right place.

       Operation *deallocOperation = std::get<1>(entry);

       if (deallocOperation) {

         deallocOperation->moveAfter(endOperation);

       } else {

         // If the Dealloc position is at the terminator operation of the

         // block, then the value should escape from a deallocation.

         Operation *nextOp = endOperation->getNextNode();

         if (!nextOp)

           continue;

         // If there is no dealloc node, insert one in the right place.

         if (failed(buildDealloc(nextOp, alloc)))

           return failure();

       }

     }

     return success();

   }


   /// Builds a deallocation operation compatible with the given allocation

   /// value. If there is no registered AllocationOpInterface implementation for

   /// the given value (e.g. in the case of a function parameter), this method

   /// builds a memref::DeallocOp.

   LogicalResult buildDealloc(Operation *op, Value alloc) {

     OpBuilder builder(op);

     auto it = aliasToAllocations.find(alloc);

     if (it != aliasToAllocations.end()) {

       // Call the allocation op interface to build a supported and

       // compatible deallocation operation.

       auto dealloc = it->second.buildDealloc(builder, alloc);

       if (!dealloc)

         return op->emitError()

                << "allocations without compatible deallocations are "

                   "not supported";

     } else {

       // Build a "default" DeallocOp for unknown allocation sources.

       builder.create<memref::DeallocOp>(alloc.getLoc(), alloc);

     }

     return success();

   }


   /// Builds a clone operation compatible with the given allocation value. If

   /// there is no registered AllocationOpInterface implementation for the given

   /// value (e.g. in the case of a function parameter), this method builds a

   /// bufferization::CloneOp.

   FailureOr<Value> buildClone(Operation *op, Value alloc) {

     OpBuilder builder(op);

     auto it = aliasToAllocations.find(alloc);

     if (it != aliasToAllocations.end()) {

       // Call the allocation op interface to build a supported and

       // compatible clone operation.

       auto clone = it->second.buildClone(builder, alloc);

       if (clone)

         return *clone;

       return (LogicalResult)(op->emitError()

                              << "allocations without compatible clone ops "

                                 "are not supported");

     }

     // Build a "default" CloneOp for unknown allocation sources.

     return builder.create<bufferization::CloneOp>(alloc.getLoc(), alloc)

         .getResult();

   }


   /// The dominator info to find the appropriate start operation to move the

   /// allocs.

   DominanceInfo dominators;


   /// The post dominator info to move the dependent allocs in the right

   /// position.

   PostDominanceInfo postDominators;


   /// Stores already cloned buffers to avoid additional clones of clones.

   ValueSetT clonedValues;


   /// Maps aliases to their source allocation interfaces (inverse mapping).

   AliasAllocationMapT aliasToAllocations;

 };


 //===----------------------------------------------------------------------===//

 // BufferDeallocationPass

 //===----------------------------------------------------------------------===//


 /// The actual buffer deallocation pass that inserts and moves dealloc nodes

 /// into the right positions. Furthermore, it inserts additional clones if

 /// necessary. It uses the algorithm described at the top of the file.

 struct BufferDeallocationPass

     : public bufferization::impl::BufferDeallocationBase<

           BufferDeallocationPass> {

   void getDependentDialects(DialectRegistry &registry) const override {

     registry.insert<bufferization::BufferizationDialect>();

     registry.insert<memref::MemRefDialect>();

   }


   void runOnOperation() override {

     func::FuncOp func = getOperation();

     if (func.isExternal())

       return;


     if (failed(deallocateBuffers(func)))

       signalPassFailure();

   }

 };


 } // namespace


 LogicalResult bufferization::deallocateBuffers(Operation *op) {

   if (isa<ModuleOp>(op)) {

     WalkResult result = op->walk([&](func::FuncOp funcOp) {

       if (failed(deallocateBuffers(funcOp)))

         return WalkResult::interrupt();

       return WalkResult::advance();

     });

     return success(!result.wasInterrupted());

   }


   // Ensure that there are supported loops only.

   Backedges backedges(op);

   if (backedges.size()) {

     op->emitError("Only structured control-flow loops are supported.");

     return failure();

   }


   // Check that the control flow structures are supported.

   if (!validateSupportedControlFlow(op))

     return failure();


   // Gather all required allocation nodes and prepare the deallocation phase.

   BufferDeallocation deallocation(op);


   // Check for supported AllocationOpInterface implementations and prepare the

   // internal deallocation pass.

   if (failed(deallocation.prepare()))

     return failure();


   // Place all required temporary clone and dealloc nodes.

   if (failed(deallocation.deallocate()))

     return failure();


   return success();

 }


 //===----------------------------------------------------------------------===//

 // BufferDeallocationPass construction

 //===----------------------------------------------------------------------===//


 std::unique_ptr<Pass> mlir::bufferization::createBufferDeallocationPass() {

   return std::make_unique<BufferDeallocationPass>();

 }

AllocationOpInterface.h

walkReturnOperations
static LogicalResult walkReturnOperations(Region *region, llvm::function_ref< LogicalResult(RegionBranchTerminatorOpInterface)> func)
Walks over all immediate return-like terminators in the given region.
Definition: BufferDeallocation.cpp:73

validateSupportedControlFlow
static bool validateSupportedControlFlow(Operation *op)
Checks if all operations that have at least one attached region implement the RegionBranchOpInterface...
Definition: BufferDeallocation.cpp:91

BufferUtils.h

Bufferization.h

Passes.h

FuncOps.h

llvm::DenseMap
Definition: LLVM.h:55

llvm::DenseSet
Definition: LLVM.h:59

llvm::MutableArrayRef
Definition: LLVM.h:62

llvm::SetVector
Definition: LLVM.h:66

llvm::SmallPtrSet
Definition: LLVM.h:68

llvm::SmallVector
Definition: LLVM.h:72

llvm::function_ref
Definition: LLVM.h:90

mlir::BlockArgument
This class represents an argument of a Block.
Definition: Value.h:319

mlir::BlockArgument::getOwner
Block * getOwner() const
Returns the block that owns this argument.
Definition: Value.h:328

mlir::BlockArgument::getArgNumber
unsigned getArgNumber() const
Returns the number of this argument.
Definition: Value.h:331

mlir::Block
Block represents an ordered list of Operations.
Definition: Block.h:33

mlir::Block::findAncestorOpInBlock
Operation * findAncestorOpInBlock(Operation &op)
Returns 'op' if 'op' lies in this block, or otherwise finds the ancestor operation of 'op' that lies ...
Definition: Block.cpp:76

mlir::Block::getParent
Region * getParent() const
Provide a 'getParent' method for ilist_node_with_parent methods.
Definition: Block.cpp:29

mlir::Block::pred_begin
pred_iterator pred_begin()
Definition: Block.h:233

mlir::Block::getSuccessors
SuccessorRange getSuccessors()
Definition: Block.h:267

mlir::Block::getOperations
OpListType & getOperations()
Definition: Block.h:137

mlir::Block::front
Operation & front()
Definition: Block.h:153

mlir::Block::pred_end
pred_iterator pred_end()
Definition: Block.h:236

mlir::DialectRegistry
The DialectRegistry maps a dialect namespace to a constructor for the matching dialect.
Definition: DialectRegistry.h:139

mlir::DialectRegistry::insert
void insert()
Definition: DialectRegistry.h:148

mlir::DominanceInfo
A class for computing basic dominance information.
Definition: Dominance.h:140

mlir::LivenessBlockInfo
This class represents liveness information on block level.
Definition: Liveness.h:99

mlir::LivenessBlockInfo::getEndOperation
Operation * getEndOperation(Value value, Operation *startOperation) const
Gets the end operation for the given value using the start operation provided (must be referenced in ...
Definition: Liveness.cpp:379

mlir::MutableOperandRange::assign
void assign(ValueRange values)
Assign this range to the given values.
Definition: OperationSupport.cpp:467

mlir::OpBuilder
This class helps build Operations.
Definition: Builders.h:216

mlir::OperandRange
This class implements the operand iterators for the Operation class.
Definition: ValueRange.h:42

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::Operation::getOperand
Value getOperand(unsigned idx)
Definition: Operation.h:350

mlir::Operation::setOperand
void setOperand(unsigned idx, Value value)
Definition: Operation.h:351

mlir::Operation::isBeforeInBlock
bool isBeforeInBlock(Operation *other)
Given an operation 'other' that is within the same parent block, return whether the current operation...
Definition: Operation.cpp:386

mlir::Operation::walk
std::enable_if_t< llvm::function_traits< std::decay_t< FnT > >::num_args==1, RetT > walk(FnT &&callback)
Walk the operation by calling the callback for each nested operation (including this one),...
Definition: Operation.h:798

mlir::Operation::create
static Operation * create(Location location, OperationName name, TypeRange resultTypes, ValueRange operands, NamedAttrList &&attributes, OpaqueProperties properties, BlockRange successors, unsigned numRegions)
Create a new Operation with the specific fields.
Definition: Operation.cpp:67

mlir::Operation::emitError
InFlightDiagnostic emitError(const Twine &message={})
Emit an error about fatal conditions with this operation, reporting up to any diagnostic handlers tha...
Definition: Operation.cpp:268

mlir::Operation::getBlock
Block * getBlock()
Returns the operation block that contains this operation.
Definition: Operation.h:213

mlir::Operation::getParentOfType
OpTy getParentOfType()
Return the closest surrounding parent operation that is of type 'OpTy'.
Definition: Operation.h:238

mlir::Operation::getRegions
MutableArrayRef< Region > getRegions()
Returns the regions held by this operation.
Definition: Operation.h:677

mlir::Operation::getResults
result_range getResults()
Definition: Operation.h:415

mlir::Operation::moveAfter
void moveAfter(Operation *existingOp)
Unlink this operation from its current block and insert it right after existingOp which may be in the...
Definition: Operation.cpp:569

mlir::PostDominanceInfo
A class for computing basic postdominance information.
Definition: Dominance.h:197

mlir::RegionBranchPoint::parent
static constexpr RegionBranchPoint parent()
Returns an instance of RegionBranchPoint representing the parent operation.
Definition: ControlFlowInterfaces.h:202

mlir::RegionSuccessor
This class represents a successor of a region.
Definition: ControlFlowInterfaces.h:165

mlir::RegionSuccessor::getSuccessorInputs
ValueRange getSuccessorInputs() const
Return the inputs to the successor that are remapped by the exit values of the current region.
Definition: ControlFlowInterfaces.h:186

mlir::RegionSuccessor::getSuccessor
Region * getSuccessor() const
Return the given region successor.
Definition: ControlFlowInterfaces.h:179

mlir::Region
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition: Region.h:26

mlir::Region::getParentOp
Operation * getParentOp()
Return the parent operation this region is attached to.
Definition: Region.h:200

mlir::Region::empty
bool empty()
Definition: Region.h:60

mlir::Region::front
Block & front()
Definition: Region.h:65

mlir::SuccessorOperands
This class models how operands are forwarded to block arguments in control flow.
Definition: ControlFlowInterfaces.h:43

mlir::SuccessorOperands::slice
MutableOperandRange slice(unsigned subStart, unsigned subLen) const
Get a slice of the operands forwarded to the successor.
Definition: ControlFlowInterfaces.h:92

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getParentBlock
Block * getParentBlock()
Return the Block in which this Value is defined.
Definition: Value.cpp:48

mlir::Value::getLoc
Location getLoc() const
Return the location of this value.
Definition: Value.cpp:26

mlir::Value::getDefiningOp
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition: Value.cpp:20

mlir::WalkResult
A utility result that is used to signal how to proceed with an ongoing walk:
Definition: Visitors.h:33

mlir::WalkResult::wasSkipped
bool wasSkipped() const
Returns true if the walk was skipped.
Definition: Visitors.h:58

mlir::WalkResult::advance
static WalkResult advance()
Definition: Visitors.h:51

mlir::WalkResult::wasInterrupted
bool wasInterrupted() const
Returns true if the walk was interrupted.
Definition: Visitors.h:55

mlir::WalkResult::interrupt
static WalkResult interrupt()
Definition: Visitors.h:50

mlir::bufferization::BufferPlacementAllocs::AllocEntry
std::tuple< Value, Operation * > AllocEntry
Represents a tuple of allocValue and deallocOperation.
Definition: BufferUtils.h:37

mlir::bufferization::BufferPlacementTransformationBase
The base class for all BufferPlacement transformations.
Definition: BufferUtils.h:102

MemRef.h

mlir::bufferization
Definition: BufferDeallocationOpInterface.h:18

mlir::bufferization::findCommonDominator
Block * findCommonDominator(Value value, const BufferViewFlowAnalysis::ValueSetT &values, const DominatorT &doms)
Finds a common dominator for the given value while taking the positions of the values in the value se...
Definition: BufferUtils.h:81

mlir::bufferization::deallocateBuffers
LogicalResult deallocateBuffers(Operation *op)
Run buffer deallocation.
Definition: BufferDeallocation.cpp:651

mlir::bufferization::createBufferDeallocationPass
std::unique_ptr< Pass > createBufferDeallocationPass()
Creates an instance of the BufferDeallocation pass to free all allocated buffers.
Definition: BufferDeallocation.cpp:691

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::clone
Operation * clone(OpBuilder &b, Operation *op, TypeRange newResultTypes, ValueRange newOperands)
Definition: StructuredOpsUtils.cpp:197