doxygen/IterationGraphSorter_8cpp_source.html

 //===- IterationGraphSorter.cpp -------------------------------------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include "IterationGraphSorter.h"


 #include "mlir/Dialect/Linalg/IR/Linalg.h"

 #include "mlir/Dialect/SparseTensor/IR/SparseTensor.h"

 #include "mlir/Dialect/Utils/StructuredOpsUtils.h"

 #include "mlir/IR/AffineExprVisitor.h"

 #include "mlir/IR/BuiltinTypes.h"


 using namespace mlir;

 using namespace mlir::sparse_tensor;


 namespace {


 /// A helper class that visits an affine expression and tries to find

 /// an AffineDimExpr to which the corresponding iterator from a GenericOp

 /// matches the desired iterator type. If there is no matched iterator

 /// type, the method returns the first DimExpr in the expression.

 class AffineDimFinder : public AffineExprVisitor<AffineDimFinder> {

 public:

   explicit AffineDimFinder(ArrayRef<utils::IteratorType> itTypes)

       : iterTypes(itTypes) {}


   /// Overrides the visit method from AffineExprVisitor.

   void visitDimExpr(AffineDimExpr expr) {

     if (pickedDim == nullptr || pickIterType == iterTypes[expr.getPosition()])

       pickedDim = expr;

   }


   /// Sets the desired iterator type that we want to pick.

   void setPickedIterType(utils::IteratorType iterType) {

     pickIterType = iterType;

   }


   /// Gets the desired AffineDimExpr.

   AffineDimExpr getDimExpr() const {

     return llvm::cast<AffineDimExpr>(pickedDim);

   }


   /// Walks the graph in post order to find dim expr.

   void walkPostOrder(AffineExpr expr) {

     pickedDim = nullptr;

     AffineExprVisitor<AffineDimFinder>::walkPostOrder(expr);

   }


 private:

   /// The picked AffineDimExpr after visit.

   AffineExpr pickedDim;

   /// The iterator type that we want.

   utils::IteratorType pickIterType;

   /// The mapping between levels and iterator types.

   ArrayRef<utils::IteratorType> iterTypes;

 };


 /// Flattens an affine expression into a list of AffineDimExprs.

 struct AffineDimCollector : public AffineExprVisitor<AffineDimCollector> {

   // Overrides method from AffineExprVisitor.

   void visitDimExpr(AffineDimExpr expr) { dims.push_back(expr); }

   SmallVector<AffineDimExpr> dims;

 };


 } // namespace


 inline static bool includesAny(SortMask mask1, SortMask mask2) {

   return static_cast<unsigned>(mask1) & static_cast<unsigned>(mask2);

 }


 inline static bool includesDenseInput(SortMask mask) {

   return includesAny(mask, SortMask::kIncludeDenseInput);

 }


 inline static bool includesDenseOutput(SortMask mask) {

   return includesAny(mask, SortMask::kIncludeDenseOutput);

 }


 AffineMap IterationGraphSorter::topoSort() {

   // The sorted result will put the first Reduction iterator to the

   // latest possible position.

   std::vector<unsigned> redIt; // reduce iterator with 0 degree

   std::vector<unsigned> parIt; // parallel iterator with 0 degree

   const unsigned numLoops = getNumLoops();

   for (unsigned i = 0; i < numLoops; i++) {

     if (inDegree[i] == 0) {

       if (iterTypes[i] == utils::IteratorType::reduction)

         redIt.push_back(i);

       else

         parIt.push_back(i);

     }

   }


   SmallVector<unsigned> loopOrder;

   while (!redIt.empty() || !parIt.empty()) {

     // We always prefer a parallel loop over a reduction loop because putting

     // a reduction loop early might make the loop sequence inadmissible.

     auto &it = !parIt.empty() ? parIt : redIt;

     auto src = it.back();

     loopOrder.push_back(src);

     it.pop_back();

     // Update in-degree, and push 0-degree node into worklist.

     for (unsigned dst = 0; dst < numLoops; dst++) {

       if (itGraph[src][dst] && --inDegree[dst] == 0) {

         if (iterTypes[dst] == utils::IteratorType::reduction)

           redIt.push_back(dst);

         else

           parIt.push_back(dst);

       }

     }

   }


   // Return the topological sort on success.

   if (loopOrder.size() == numLoops)

     return AffineMap::getPermutationMap(loopOrder, out.getContext());


   // Cycle detected.

   return AffineMap();

 }


 IterationGraphSorter

 IterationGraphSorter::fromGenericOp(linalg::GenericOp genericOp) {

   // Must be a demapped sparse kernel.

   assert(!hasAnyNonIdentityOperandsOrResults(genericOp) &&

          hasAnySparseOperandOrResult(genericOp) &&

          genericOp.getNumDpsInits() == 1);


   SmallVector<AffineMap> loopMap = genericOp.getIndexingMapsArray();

   SmallVector<Value> ins = genericOp.getDpsInputs();


   AffineMap outMap = loopMap.back();

   loopMap.pop_back();


   Value out = genericOp.getDpsInitOperand(0)->get();

   SmallVector<utils::IteratorType> iterTypes =

       genericOp.getIteratorTypesArray();


   return IterationGraphSorter(std::move(ins), std::move(loopMap), out, outMap,

                               std::move(iterTypes));

 }


 IterationGraphSorter::IterationGraphSorter(

     SmallVector<Value> &&ins, SmallVector<AffineMap> &&loop2InsLvl, Value out,

     AffineMap loop2OutLvl, SmallVector<utils::IteratorType> &&iterTypes)

     : ins(std::move(ins)), loop2InsLvl(std::move(loop2InsLvl)), out(out),

       loop2OutLvl(loop2OutLvl), iterTypes(std::move(iterTypes)) {

   // One map per tensor.

   assert(loop2InsLvl.size() == ins.size());

   // All the affine maps have the same number of dimensions (loops).

   assert(llvm::all_equal(llvm::map_range(

       loop2InsLvl, [](AffineMap m) { return m.getNumDims(); })));

   // The number of results of the map should match the rank of the tensor.

   assert(llvm::all_of(llvm::zip(loop2InsLvl, ins), [](auto mvPair) {

     auto [m, v] = mvPair;

     return m.getNumResults() == cast<ShapedType>(v.getType()).getRank();

   }));


   itGraph.resize(getNumLoops(), std::vector<bool>(getNumLoops(), false));

   inDegree.resize(getNumLoops());

 }


 AffineMap IterationGraphSorter::sort(SortMask mask, Value ignored) {

   // Reset the adjacency matrix that represents the iteration graph.

   for (auto &row : itGraph)

     llvm::fill(row, false);


   // Reset in-degree.

   llvm::fill(inDegree, 0);


   // Add the constraints for the loop to level map.

   for (auto [in, map] : llvm::zip(ins, loop2InsLvl)) {

     // Get map and encoding.

     const auto enc = getSparseTensorEncoding(in.getType());

     // Skip dense inputs when not requested.

     if ((!enc && !includesDenseInput(mask)) || in == ignored)

       continue;

     addConstraints(in, map);

   }


   // Add the constraints for the output map.

   const auto enc = getSparseTensorEncoding(out.getType());

   if ((enc || includesDenseOutput(mask)) && out != ignored)

     addConstraints(out, loop2OutLvl);


   // Return the topological sort (empty for cyclic).

   return topoSort();

 }


 void IterationGraphSorter::addConstraints(Value t, AffineMap loop2LvlMap) {

   auto addIterOrdering = [this](unsigned f, unsigned t) {

     if (!itGraph[f][t] && f != t) {

       itGraph[f][t] = true;

       inDegree[t]++;

     }

   };


   // Set up a reduction finder.

   AffineDimFinder finder(iterTypes);

   finder.setPickedIterType(utils::IteratorType::reduction);


   // To compute iteration graph for tensor[d0 + d1 + d3, d4 + d5 + d6],

   // we require there exist d_x \in {d0, d1, d3} and d_y \in {d4, d5, d6},

   // and d_x > d_y && {d0, d1, d3} - d_x > {d4, d5, d6} - d_y

   const Level lvlRank = loop2LvlMap.getNumResults();

   for (Level lvl = 1; lvl < lvlRank; lvl++) {

     const AffineExpr fa = loop2LvlMap.getResult(lvl - 1);

     const AffineExpr ta = loop2LvlMap.getResult(lvl);


     if (llvm::isa<AffineDimExpr>(fa) || llvm::isa<AffineDimExpr>(ta)) {

       // Special case when at least one loop2LvlExp is a simple AffineDimExpr

       // (say, d0) and we require d0 > {d1, d2, ...} or {d1, d2, ...} > d0

       AffineDimCollector fCollector;

       fCollector.walkPostOrder(fa);

       AffineDimCollector tCollector;

       tCollector.walkPostOrder(ta);


       for (auto fd : fCollector.dims) {

         for (auto td : tCollector.dims) {

           const unsigned f = fd.getPosition();

           const unsigned t = td.getPosition();

           addIterOrdering(f, t);

         }

       }

       continue;

     }


     // When both loop2LvlExpr is compound, we pick an abitrary reduction loop

     // from lhs and rhs and use them as d_x and d_y.

     finder.walkPostOrder(fa);

     const AffineDimExpr fexp = finder.getDimExpr();

     const unsigned fldx = fexp.getPosition();


     finder.walkPostOrder(ta);

     const AffineDimExpr texp = finder.getDimExpr();

     const unsigned tldx = texp.getPosition();


     // d_x > d_y

     addIterOrdering(fldx, tldx);


     AffineDimCollector fCollector;

     fCollector.walkPostOrder(fa);

     AffineDimCollector tCollector;

     tCollector.walkPostOrder(ta);


     // Make sure dx and dy is the last.

     for (auto fd : fCollector.dims) {

       const unsigned f = fd.getPosition();

       addIterOrdering(f, fldx);

     }

     for (auto td : tCollector.dims) {

       const unsigned t = td.getPosition();

       addIterOrdering(t, tldx);

     }

     // {d0, d1, d3} - d_x > {d4, d5, d6} - d_y

     // This is to ensure that the affine expressions are reduced in sparse

     // tensor level ordering.

     for (auto fd : fCollector.dims) {

       const unsigned f = fd.getPosition();

       if (f == fldx) // skip d_x

         continue;

       for (auto td : tCollector.dims) {

         const unsigned t = td.getPosition();

         if (t == tldx) // skip d_y

           continue;

         addIterOrdering(f, t);

       }

     }

   }

 }

AffineExprVisitor.h

includesDenseOutput
static bool includesDenseOutput(SortMask mask)
Definition: IterationGraphSorter.cpp:79

includesAny
static bool includesAny(SortMask mask1, SortMask mask2)
Definition: IterationGraphSorter.cpp:71

includesDenseInput
static bool includesDenseInput(SortMask mask)
Definition: IterationGraphSorter.cpp:75

IterationGraphSorter.h

StructuredOpsUtils.h

llvm::ArrayRef
Definition: LLVM.h:48

llvm::SmallVector
Definition: LLVM.h:72

mlir::AffineDimExpr
A dimensional identifier appearing in an affine expression.
Definition: AffineExpr.h:223

mlir::AffineDimExpr::getPosition
unsigned getPosition() const
Definition: AffineExpr.cpp:346

mlir::AffineExprVisitor
See documentation for AffineExprVisitorBase.
Definition: AffineExprVisitor.h:144

mlir::AffineExprVisitor::walkPostOrder
RetTy walkPostOrder(AffineExpr expr)
Definition: AffineExprVisitor.h:150

mlir::AffineExpr
Base type for affine expression.
Definition: AffineExpr.h:68

mlir::AffineMap
A multi-dimensional affine map Affine map's are immutable like Type's, and they are uniqued.
Definition: AffineMap.h:46

mlir::AffineMap::getNumDims
unsigned getNumDims() const
Definition: AffineMap.cpp:390

mlir::AffineMap::getNumResults
unsigned getNumResults() const
Definition: AffineMap.cpp:398

mlir::AffineMap::getResult
AffineExpr getResult(unsigned idx) const
Definition: AffineMap.cpp:407

mlir::AffineMap::getPermutationMap
static AffineMap getPermutationMap(ArrayRef< unsigned > permutation, MLIRContext *context)
Returns an AffineMap representing a permutation.
Definition: AffineMap.cpp:260

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getContext
MLIRContext * getContext() const
Utility to get the associated MLIRContext that this value is defined in.
Definition: Value.h:108

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:105

mlir::sparse_tensor::IterationGraphSorter
Definition: IterationGraphSorter.h:42

mlir::sparse_tensor::IterationGraphSorter::getNumLoops
unsigned getNumLoops() const
Returns the number of loops in the iteration graph.
Definition: IterationGraphSorter.h:54

mlir::sparse_tensor::IterationGraphSorter::fromGenericOp
static IterationGraphSorter fromGenericOp(linalg::GenericOp genericOp)
Factory method that construct an iteration graph sorter for the given linalg.generic operation.
Definition: IterationGraphSorter.cpp:126

mlir::sparse_tensor::IterationGraphSorter::sort
AffineMap sort(SortMask mask, Value ignored=nullptr)
Returns a permutation that represents the scheduled loop order.
Definition: IterationGraphSorter.cpp:166

Linalg.h

SparseTensor.h

BuiltinTypes.h

mlir::sparse_tensor
Definition: Enums.h:41

mlir::sparse_tensor::hasAnySparseOperandOrResult
bool hasAnySparseOperandOrResult(Operation *op)
Returns true iff MLIR operand has any sparse operand or result.
Definition: SparseTensor.h:196

mlir::sparse_tensor::Level
uint64_t Level
The type of level identifiers and level-ranks.
Definition: SparseTensor.h:42

mlir::sparse_tensor::getSparseTensorEncoding
SparseTensorEncodingAttr getSparseTensorEncoding(Type type)
Convenience method to get a sparse encoding attribute from a type.
Definition: SparseTensorDialect.cpp:1033

mlir::sparse_tensor::hasAnyNonIdentityOperandsOrResults
bool hasAnyNonIdentityOperandsOrResults(Operation *op)
Returns true iff MLIR operation has any sparse tensor with non-identity dim2lvl maps.
Definition: SparseTensorDialect.cpp:1171

mlir::sparse_tensor::SortMask
SortMask
Iteration graph sorting mask,.
Definition: IterationGraphSorter.h:32

mlir::sparse_tensor::SortMask::kIncludeDenseInput
@ kIncludeDenseInput

mlir::sparse_tensor::SortMask::kIncludeDenseOutput
@ kIncludeDenseOutput

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20