doxygen/Merger_8cpp_source.html

 //===- Merger.cpp - Implementation of iteration lattices ------------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/SparseTensor/Utils/Merger.h"

 #include "mlir/Dialect/Arith/IR/Arith.h"

 #include "mlir/Dialect/Complex/IR/Complex.h"

 #include "mlir/Dialect/Math/IR/Math.h"

 #include "mlir/Dialect/SparseTensor/IR/SparseTensor.h"


 #include "mlir/IR/Operation.h"

 #include "llvm/Support/Debug.h"

 #include <optional>


 namespace mlir {

 namespace sparse_tensor {


 enum class ExpArity {

   kNullary,

   kUnary,

   kBinary,

 };


 static ExpArity getExpArity(TensorExp::Kind k) {

   switch (k) {

   // Leaf.

   case TensorExp::Kind::kTensor:

   case TensorExp::Kind::kInvariant:

   case TensorExp::Kind::kLoopVar:

   case TensorExp::Kind::kSynZero:

     return ExpArity::kNullary;

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

   case TensorExp::Kind::kCeilF:

   case TensorExp::Kind::kFloorF:

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

   case TensorExp::Kind::kRelu:

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kCIm:

   case TensorExp::Kind::kCRe:

   case TensorExp::Kind::kBitCast:

   case TensorExp::Kind::kBinaryBranch:

   case TensorExp::Kind::kUnary:

   case TensorExp::Kind::kSelect:

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

     return ExpArity::kUnary;

   // Binary operations.

   case TensorExp::Kind::kDivF:

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

   case TensorExp::Kind::kShrS:

   case TensorExp::Kind::kShrU:

   case TensorExp::Kind::kShlI:

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

   case TensorExp::Kind::kAndI:

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

   case TensorExp::Kind::kOrI:

   case TensorExp::Kind::kXorI:

   case TensorExp::Kind::kBinary:

   case TensorExp::Kind::kReduce:

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

   case TensorExp::Kind::kDenseOp: // kDenseOp can *at most* have two operands

     return ExpArity::kBinary;

   }

   llvm_unreachable("unexpected kind");

 }


 //===----------------------------------------------------------------------===//

 // Constructors.

 //===----------------------------------------------------------------------===//


 TensorExp::TensorExp(TensorExp::Kind k, unsigned x, ExprId y, Value v,

                      Operation *o, Attribute a)

     : kind(k), val(v), op(o), attr(a) {

   switch (kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

     assert(x != detail::kInvalidId && y == detail::kInvalidId && !v && !o);

     tensor = x;

     return;

   case TensorExp::Kind::kSynZero:

     assert(x == detail::kInvalidId && y == detail::kInvalidId && !v && !o);

     return;

   case TensorExp::Kind::kInvariant:

     assert(x == detail::kInvalidId && y == detail::kInvalidId && v && !o);

     return;

   case TensorExp::Kind::kLoopVar:

     assert(x != detail::kInvalidId && y == detail::kInvalidId && !v && !o);

     loop = x;

     return;

   // Unary operations.

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

   case TensorExp::Kind::kCeilF:

   case TensorExp::Kind::kFloorF:

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

   case TensorExp::Kind::kRelu:

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

   case TensorExp::Kind::kCIm:

   case TensorExp::Kind::kCRe:

     assert(x != detail::kInvalidId && y == detail::kInvalidId && !v && !o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kBitCast:

     assert(x != detail::kInvalidId && y == detail::kInvalidId && v && !o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kBinaryBranch:

   case TensorExp::Kind::kSelect:

     assert(x != detail::kInvalidId && y == detail::kInvalidId && !v && o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kUnary:

     // No assertion on y can be made, as the branching paths involve both

     // a unary (`mapSet`) and binary (`disjSet`) pathway.

     assert(x != detail::kInvalidId && !v && o);

     children.e0 = x;

     children.e1 = y;

     return;

   // Binary operations.

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

   case TensorExp::Kind::kDivF:

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

   case TensorExp::Kind::kAndI:

   case TensorExp::Kind::kOrI:

   case TensorExp::Kind::kXorI:

   case TensorExp::Kind::kShrS:

   case TensorExp::Kind::kShrU:

   case TensorExp::Kind::kShlI:

     assert(x != detail::kInvalidId && y != detail::kInvalidId && !v && !o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

     assert(x != detail::kInvalidId && y != detail::kInvalidId && !v && !o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kBinary:

   case TensorExp::Kind::kReduce:

     assert(x != detail::kInvalidId && y != detail::kInvalidId && !v && o);

     children.e0 = x;

     children.e1 = y;

     return;

   case TensorExp::Kind::kDenseOp:

     assert(x != detail::kInvalidId && !v && o);

     children.e0 = x;

     children.e1 = y;

     return;

   }

   llvm_unreachable("unexpected kind");

 }


 Merger::Merger(unsigned numInputOutputTensors, unsigned numLoops,

                unsigned maxLvlRank)

     : outTensor(numInputOutputTensors - 1),

       syntheticTensor(numInputOutputTensors),

       numTensors(numInputOutputTensors + 1), numLoops(numLoops),

       hasSparseOut(false),

       lvlTypes(numTensors,

                std::vector<LevelType>(numLoops, LevelFormat::Undef)),

       loopToLvl(numTensors,

                 std::vector<std::optional<Level>>(numLoops, std::nullopt)),

       lvlToLoop(numTensors,

                 std::vector<std::optional<LoopId>>(maxLvlRank, std::nullopt)),

       loopToUnresolvedLvls(numLoops, std::vector<std::optional<LvlLTPair>>(

                                          numTensors, std::nullopt)),

       levelToDependentLoop(numTensors,

                            std::vector<std::vector<LoopCoeffPair>>(

                                maxLvlRank, std::vector<LoopCoeffPair>())),

       loopBounds(numLoops, std::make_pair(numTensors, numLoops)) {}


 //===----------------------------------------------------------------------===//

 // Lattice methods.

 //===----------------------------------------------------------------------===//


 ExprId Merger::addTensorExp(TensorId t) {

   assert(isValidTensorId(t));

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(TensorExp::Kind::kTensor, t, detail::kInvalidId,

                           Value(), nullptr, nullptr);

   return eNew;

 }


 ExprId Merger::addLoopVarExp(LoopId i) {

   assert(isValidLoopId(i));

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(TensorExp::Kind::kLoopVar, i, detail::kInvalidId,

                           Value(), nullptr, nullptr);

   return eNew;

 }


 ExprId Merger::addInvariantExp(Value v) {

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(TensorExp::Kind::kInvariant, detail::kInvalidId,

                           detail::kInvalidId, v, nullptr, nullptr);

   return eNew;

 }


 ExprId Merger::addSynZeroExp() {

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(TensorExp::Kind::kSynZero, detail::kInvalidId,

                           detail::kInvalidId, Value(), nullptr, nullptr);

   return eNew;

 }


 ExprId Merger::addExp(TensorExp::Kind k, ExprId e0, ExprId e1, Operation *op,

                       Attribute attr) {

   assert(k > TensorExp::Kind::kLoopVar);

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(k, e0, e1, Value(), op, attr);

   return eNew;

 }


 ExprId Merger::addExp(TensorExp::Kind k, ExprId e, Value v, Operation *op,

                       Attribute attr) {

   assert(k > TensorExp::Kind::kLoopVar);

   const ExprId eNew(tensorExps.size());

   tensorExps.emplace_back(k, e, detail::kInvalidId, v, op, attr);

   return eNew;

 }


 LatPointId Merger::addLat(TensorId t, LoopId i, ExprId e) {

   const LatPointId pNew(latPoints.size());

   const unsigned size = numLoops * numTensors;

   const TensorLoopId b = makeTensorLoopId(t, i);

   latPoints.emplace_back(size, e);

   latPoints[pNew].bits.set(b);

   return pNew;

 }


 LatPointId Merger::addLat(const BitVector &bits, ExprId e) {

   assert(bits.size() == numLoops * numTensors);

   const LatPointId pNew(latPoints.size());

   latPoints.emplace_back(bits, e);

   return pNew;

 }


 LatSetId Merger::addSet() {

   const LatSetId sNew(latSets.size());

   latSets.emplace_back();

   return sNew;

 }


 LatPointId Merger::conjLat(ExprId e, LatPointId p0, LatPointId p1,

                            Operation *op) {

   TensorExp::Kind kind = exp(e).kind;

   Attribute attr = exp(e).attr;

   const LatPointId pNew(latPoints.size());

   const auto &point0 = lat(p0);

   const auto &point1 = lat(p1);

   BitVector bits(point0.bits);

   bits |= point1.bits;

   const ExprId ne = addExp(kind, point0.exp, point1.exp, op, attr);

   latPoints.emplace_back(bits, ne);

   return pNew;

 }


 LatSetId Merger::conjSet(ExprId e, LatSetId s0, LatSetId s1, Operation *op) {

   const LatSetId sNew = addSet();

   auto &setNew = latSets[sNew];

   for (const LatPointId p0 : set(s0))

     for (const LatPointId p1 : set(s1))

       setNew.push_back(conjLat(e, p0, p1, op));

   return sNew;

 }


 LatSetId Merger::disjSet(ExprId e, LatSetId s0, LatSetId s1, Operation *op) {

   const LatSetId sNew = conjSet(e, s0, s1, op);

   TensorExp::Kind kind = exp(e).kind;

   // Followed by all in s0.

   latSets[sNew].append(latSets[s0]);

   // Map binary 0-y to unary -y.

   // TODO: move this if-else logic into buildLattices

   if (kind == TensorExp::Kind::kSubF)

     s1 = mapSet(TensorExp::Kind::kNegF, s1);

   else if (kind == TensorExp::Kind::kSubC)

     s1 = mapSet(TensorExp::Kind::kNegC, s1);

   else if (kind == TensorExp::Kind::kSubI)

     s1 = mapSet(TensorExp::Kind::kNegI, s1);

   // Followed by all in s1.

   latSets[sNew].append(latSets[s1]);

   return sNew;

 }


 LatSetId Merger::disjSetWithZero(ExprId e, LatSetId s0, LatSetId s1) {

   assert(exp(e).kind == TensorExp::Kind::kCmpI ||

          exp(e).kind == TensorExp::Kind::kCmpF);

   const LatSetId sNew = conjSet(e, s0, s1, nullptr);


   ExprId e0 = exp(e).children.e0;

   ExprId e1 = exp(e).children.e1;

   if (exp(e0).kind == TensorExp::Kind::kSynZero ||

       exp(e1).kind == TensorExp::Kind::kSynZero) {

     // lhs and rhs can't be synthetic zero at the same time.

     assert(exp(e0).kind != exp(e1).kind);

     // If one of the operands has already been assigned to zero (the

     // element is absent in the corresponding operand), then we do not

     // need to build disjunctive set for it.

     return sNew;

   }


   auto lhsSet = mapBinWithSynZeroSet(e, s0, false);

   auto rhsSet = mapBinWithSynZeroSet(e, s1, true);

   latSets[sNew].append(latSets[lhsSet]);

   latSets[sNew].append(latSets[rhsSet]);

   return sNew;

 }


 LatSetId Merger::combiSet(ExprId e, LatSetId s0, LatSetId s1, Operation *orig,

                           bool includeLeft, TensorExp::Kind ltrans,

                           Operation *opleft, bool includeRight,

                           TensorExp::Kind rtrans, Operation *opright) {

   Attribute a = exp(e).attr;

   const LatSetId sNew = conjSet(e, s0, s1, orig);

   // Left Region.

   if (includeLeft) {

     if (opleft)

       s0 = mapSet(ltrans, s0, Value(), opleft, a);

     latSets[sNew].append(latSets[s0]);

   }

   // Right Region.

   if (includeRight) {

     if (opright)

       s1 = mapSet(rtrans, s1, Value(), opright, a);

     latSets[sNew].append(latSets[s1]);

   }

   return sNew;

 }


 LatSetId Merger::mapSet(TensorExp::Kind kind, LatSetId s0, Value v,

                         Operation *op, Attribute a) {

   assert((TensorExp::Kind::kAbsF <= kind && kind <= TensorExp::Kind::kSelect) ||

          TensorExp::Kind::kDenseOp == kind);

   const LatSetId sNew = addSet();

   auto &setNew = latSets[sNew];

   for (const LatPointId p : set(s0)) {

     const auto &point = latPoints[p];

     setNew.push_back(addLat(point.bits, addExp(kind, point.exp, v, op, a)));

   }

   return sNew;

 }


 LatSetId Merger::mapBinWithSynZeroSet(ExprId e, LatSetId s0, bool lhsZero) {

   TensorExp::Kind kind = exp(e).kind;

   Attribute a = exp(e).attr;

   assert(TensorExp::Kind::kMulF <= kind && kind <= TensorExp::Kind::kShlI);

   // Must be a binary operation.

   const LatSetId sNew = addSet();

   auto &setNew = latSets[sNew];

   const ExprId zeroExp = addSynZeroExp();

   for (const LatPointId p : set(s0)) {

     const auto &point = latPoints[p];

     ExprId newExp = lhsZero ? addExp(kind, zeroExp, point.exp, nullptr, a)

                             : addExp(kind, point.exp, zeroExp, nullptr, a);

     setNew.push_back(addLat(point.bits, newExp));

   }

   return sNew;

 }


 LatSetId Merger::optimizeSet(LatSetId s0) {

   const LatSetId sNew = addSet();

   auto &setNew = latSets[sNew];

   const auto &set0 = set(s0);

   assert(!set0.empty());

   const LatPointId p0 = set0[0];

   for (const LatPointId p1 : set0) {

     bool add = true;

     if (p0 != p1) {

       // Check whether this is a straightforward copy.

       if (expIsTensor(latPoints[p1].exp, outTensor))

         continue;

       // Check whether this conjunction is already covered.

       for (const LatPointId p2 : setNew) {

         assert(!latGT(p1, p2)); // Lj => Li would be bad

         if (onlyDenseDiff(p2, p1)) {

           add = false;

           break;

         }

       }

       assert(!add || latGT(p0, p1));

     }

     if (add)

       setNew.push_back(p1);

   }

   for (const LatPointId p : setNew)

     latPoints[p].simple = simplifyCond(sNew, p);

   return sNew;

 }


 BitVector Merger::simplifyCond(LatSetId s0, LatPointId p0) {

   // First determine if this lattice point is a *singleton*, i.e.,

   // the last point in a lattice, no other is less than this one.

   bool isSingleton = true;

   for (const LatPointId p1 : set(s0)) {

     if (p0 != p1 && latGT(p0, p1)) {

       isSingleton = false;

       break;

     }

   }


   BitVector simple(latPoints[p0].bits);

   bool reset = isSingleton && hasAnySparse(simple);

   const TensorLoopId be = simple.size();

   TensorLoopId offset = 0; // relative to the end

   if (!reset)

     // Starts resetting from a dense level, so that the first bit (if kept)

     // is not undefined level-type.

     for (unsigned b = 0; b < be; b++) {

       if (simple[b] && getLvlType(TensorLoopId{b}).hasDenseSemantic()) {

         offset = be - b - 1; // relative to the end

         break;

       }

     }


   // Now apply the two basic rules. We also iterate the bits reversely to always

   // keep the rightmost bit (which could possibly be a synthetic tensor).

   for (unsigned b = be - 1 - offset, i = 0; i < be;

        b = b == 0 ? be - 1 : b - 1, i++) {

     // Slice on dense level has `locate` property as well, and can be optimized.

     if (simple[b] && !isSparseLvlWithNonTrivialIdxExp(b)) {

       const auto lt = getLvlType(b);

       if (!lt.hasSparseSemantic()) {

         if (reset)

           simple.reset(b);

         reset = true;

       }

     }

   }

   return simple;

 }


 bool Merger::latGT(LatPointId i, LatPointId j) const {

   const BitVector &bitsi = lat(i).bits;

   const BitVector &bitsj = lat(j).bits;

   assert(bitsi.size() == bitsj.size());

   if (bitsi.count() > bitsj.count()) {

     for (TensorLoopId b = 0, be = bitsj.size(); b < be; b++)

       if (bitsj[b] && !bitsi[b])

         return false;

     return true;

   }

   return false;

 }


 bool Merger::onlyDenseDiff(LatPointId i, LatPointId j) const {

   BitVector tmp(latPoints[j].bits);

   tmp ^= latPoints[i].bits;

   return !hasAnySparse(tmp);

 }


 bool Merger::expContainsTensor(ExprId e, TensorId t) const {

   const auto &expr = exp(e);

   // First we check `expIsTensor`.

   if (expr.kind == TensorExp::Kind::kTensor)

     return expr.tensor == t;


   switch (getExpArity(expr.kind)) {

   case ExpArity::kNullary:

     return false;

   case ExpArity::kUnary: {

     const ExprId e0 = expr.children.e0;

     return expContainsTensor(e0, t);

   }

   case ExpArity::kBinary: {

     const ExprId e0 = expr.children.e0;

     const ExprId e1 = expr.children.e1;

     return expContainsTensor(e0, t) || expContainsTensor(e1, t);

   }

   }

   llvm_unreachable("unexpected arity");

 }


 bool Merger::hasNegateOnOut(ExprId e) const {

   const auto &expr = exp(e);

   switch (expr.kind) {

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

     return expContainsTensor(expr.children.e0, outTensor);

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

     return expContainsTensor(expr.children.e1, outTensor) ||

            hasNegateOnOut(expr.children.e0);

   case TensorExp::Kind::kDenseOp: {

     bool lhsNeg = hasNegateOnOut(expr.children.e0);

     if (!lhsNeg && expr.children.e1 != detail::kInvalidId)

       return hasNegateOnOut(expr.children.e1);

     return lhsNeg;

   }

   default: {

     switch (getExpArity(expr.kind)) {

     case ExpArity::kNullary:

       return false;

     case ExpArity::kUnary:

       return hasNegateOnOut(expr.children.e0);

     case ExpArity::kBinary:

       return hasNegateOnOut(expr.children.e0) ||

              hasNegateOnOut(expr.children.e1);

     }

   }

   }

   llvm_unreachable("unexpected kind");

 }


 bool Merger::isSingleCondition(TensorId t, ExprId e) const {

   assert(isValidTensorId(t));

   const auto &expr = exp(e);

   switch (expr.kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

     return expr.tensor == t;

   case TensorExp::Kind::kInvariant:

   case TensorExp::Kind::kLoopVar:

   case TensorExp::Kind::kSynZero:

     return false;

   // Unary operations.

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

   case TensorExp::Kind::kCeilF:

   case TensorExp::Kind::kFloorF:

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

   case TensorExp::Kind::kRelu:

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kCIm:

   case TensorExp::Kind::kCRe:

   case TensorExp::Kind::kBitCast:

   case TensorExp::Kind::kUnary:

     return isSingleCondition(t, expr.children.e0);

   case TensorExp::Kind::kBinaryBranch:

   case TensorExp::Kind::kSelect:

     return false;

   // Binary operations.

   case TensorExp::Kind::kDivF: // note: x / c only

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

     assert(!maybeZero(expr.children.e1));

     return isSingleCondition(t, expr.children.e0);

   case TensorExp::Kind::kShrS: // note: x >> inv only

   case TensorExp::Kind::kShrU:

   case TensorExp::Kind::kShlI:

     assert(isInvariant(expr.children.e1));

     return isSingleCondition(t, expr.children.e0);

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

   case TensorExp::Kind::kAndI:

   case TensorExp::Kind::kReduce:

     if (isSingleCondition(t, expr.children.e0))

       return isSingleCondition(t, expr.children.e1) ||

              isInvariant(expr.children.e1);

     if (isSingleCondition(t, expr.children.e1))

       return isInvariant(expr.children.e0);

     return false;

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

     return isSingleCondition(t, expr.children.e0) &&

            isSingleCondition(t, expr.children.e1);

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

   case TensorExp::Kind::kOrI:

   case TensorExp::Kind::kXorI:

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

   case TensorExp::Kind::kBinary:

     return false;

   case TensorExp::Kind::kDenseOp:

     // Since Merger guarantees all the operands of the kDenseOp to be dense, the

     // operation must be single-condition.

     return true;

   }

   llvm_unreachable("unexpected kind");

 }


 bool Merger::hasAnySparse(const BitVector &bits) const {

   for (TensorLoopId b : bits.set_bits()) {

     const auto lt = getLvlType(b);

     if (lt.hasSparseSemantic())

       return true;

   }

   return hasSparseIdxReduction(bits);

 }


 bool Merger::hasSparseIdxReduction(const BitVector &bits) const {

   for (TensorLoopId b : bits.set_bits())

     if (isSparseLvlWithNonTrivialIdxExp(b))

       return true;

   return false;

 }


 #ifndef NDEBUG


 //===----------------------------------------------------------------------===//

 // Print methods (for debugging).

 //===----------------------------------------------------------------------===//


 static const char *kindToOpSymbol(TensorExp::Kind kind) {

   switch (kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

     return "tensor";

   case TensorExp::Kind::kInvariant:

     return "invariant";

   case TensorExp::Kind::kLoopVar:

     return "index";

   case TensorExp::Kind::kSynZero:

     return "0";

   // Unary operations.

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

     return "abs";

   case TensorExp::Kind::kCeilF:

     return "ceil";

   case TensorExp::Kind::kFloorF:

     return "floor";

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

     return "sqrt";

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

     return "expm1";

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

     return "log1p";

   case TensorExp::Kind::kRelu:

     return "relu";

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

     return "sin";

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

     return "tanh";

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

     return "-";

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kCIm:

     return "complex.im";

   case TensorExp::Kind::kCRe:

     return "complex.re";

   case TensorExp::Kind::kBitCast:

     return "cast";

   case TensorExp::Kind::kBinaryBranch:

     return "binary_branch";

   case TensorExp::Kind::kUnary:

     return "unary";

   case TensorExp::Kind::kSelect:

     return "select";

   // Binary operations.

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

     return "*";

   case TensorExp::Kind::kDivF:

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

     return "/";

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

     return "+";

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

     return "-";

   case TensorExp::Kind::kAndI:

     return "&";

   case TensorExp::Kind::kOrI:

     return "|";

   case TensorExp::Kind::kXorI:

     return "^";

   case TensorExp::Kind::kShrS:

     return "a>>";

   case TensorExp::Kind::kShrU:

     return ">>";

   case TensorExp::Kind::kShlI:

     return "<<";

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

     return "cmp";

   case TensorExp::Kind::kBinary:

     return "binary";

   case TensorExp::Kind::kReduce:

     return "reduce";

   case TensorExp::Kind::kDenseOp:

     return "dense";

   }

   llvm_unreachable("unexpected kind for symbol");

 }


 void Merger::dumpExp(ExprId e) const {

   const auto &expr = exp(e);

   switch (expr.kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

     if (expr.tensor == syntheticTensor)

       llvm::dbgs() << "synthetic_";

     else if (expr.tensor == outTensor)

       llvm::dbgs() << "output_";

     llvm::dbgs() << "tensor_" << expr.tensor;

     break;

   case TensorExp::Kind::kInvariant:

     llvm::dbgs() << "invariant";

     break;

   case TensorExp::Kind::kSynZero:

     llvm::dbgs() << "0";

     break;

   case TensorExp::Kind::kLoopVar:

     llvm::dbgs() << "loopvar_" << expr.loop;

     break;

   // Unary operations.

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

   case TensorExp::Kind::kCeilF:

   case TensorExp::Kind::kFloorF:

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

   case TensorExp::Kind::kRelu:

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kCIm:

   case TensorExp::Kind::kCRe:

   case TensorExp::Kind::kBitCast:

   case TensorExp::Kind::kBinaryBranch:

   case TensorExp::Kind::kUnary:

   case TensorExp::Kind::kSelect:

     llvm::dbgs() << kindToOpSymbol(expr.kind) << " ";

     dumpExp(expr.children.e0);

     break;

   // Binary operations.

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

   case TensorExp::Kind::kDivF:

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

   case TensorExp::Kind::kAndI:

   case TensorExp::Kind::kOrI:

   case TensorExp::Kind::kXorI:

   case TensorExp::Kind::kShrS:

   case TensorExp::Kind::kShrU:

   case TensorExp::Kind::kShlI:

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

   case TensorExp::Kind::kBinary:

   case TensorExp::Kind::kReduce:

   case TensorExp::Kind::kDenseOp:

     llvm::dbgs() << "(";

     dumpExp(expr.children.e0);

     llvm::dbgs() << " " << kindToOpSymbol(expr.kind);

     if (expr.attr)

       llvm::dbgs() << "{" << expr.attr << "}";

     if (expr.children.e1 != detail::kInvalidId) {

       llvm::dbgs() << " ";

       dumpExp(expr.children.e1);

       llvm::dbgs() << ")";

     } else {

       assert(expr.kind == TensorExp::Kind::kDenseOp);

     }

     break;

   }

 }


 void Merger::dumpLat(LatPointId p) const {

   const auto &point = lat(p);

   llvm::dbgs() << "lat(";

   dumpBits(point.bits);

   llvm::dbgs() << " :";

   dumpBits(point.simple);

   llvm::dbgs() << " : ";

   dumpExp(point.exp);

   llvm::dbgs() << " )\n";

 }


 void Merger::dumpSet(LatSetId s) const {

   const auto &ss = set(s);

   llvm::dbgs() << "{ #" << ss.size() << "\n";

   for (const LatPointId p : ss) {

     llvm::dbgs() << "  ";

     dumpLat(p);

   }

   llvm::dbgs() << "}\n";

 }


 void Merger::dumpBits(const BitVector &bits) const {

   for (TensorLoopId b = 0, be = bits.size(); b < be; b++) {

     if (bits[b]) {

       const TensorId t = tensor(b);

       const LoopId i = loop(b);

       const auto lt = lvlTypes[t][i];

       if (isLvlWithNonTrivialIdxExp(b))

         llvm::dbgs() << " DEP_" << t << "_" << i;

       else

         llvm::dbgs() << " i_" << t << "_" << i << "_" << toMLIRString(lt);

     }

   }

 }


 #endif // NDEBUG


 //===----------------------------------------------------------------------===//

 // Builder methods.

 //===----------------------------------------------------------------------===//


 LatSetId Merger::buildLattices(ExprId e, LoopId i) {

   // NOTE: The `expr` reference will be invalidated by recursive calls

   // (and any other method that may add new expressions); therefore, the

   // code below must make sure to copy fields of `expr` into local variables

   // before making any recursive calls.

   const auto &expr = exp(e);

   const TensorExp::Kind kind = expr.kind;

   switch (kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

   case TensorExp::Kind::kInvariant:

   case TensorExp::Kind::kSynZero:

   case TensorExp::Kind::kLoopVar: {

     // Either the loop-var is really used in the tensor expression, or it is

     // set to the undefined loop-var in that level. An invariant expression,

     // a proper index value, and a truly dynamic sparse output tensor are set

     // to a synthetic tensor with undefined indices only to ensure the

     // iteration space is not skipped as a result of their contents.

     const LatSetId s = addSet();

     TensorId t = syntheticTensor;

     if (kind == TensorExp::Kind::kTensor) {

       t = expr.tensor;

       if (hasSparseOut && t == outTensor)

         t = syntheticTensor;

     }

     latSets[s].push_back(addLat(t, i, e));

     return s;

   }

   // Unary operations.

   case TensorExp::Kind::kAbsF:

   case TensorExp::Kind::kAbsC:

   case TensorExp::Kind::kAbsI:

   case TensorExp::Kind::kCeilF:

   case TensorExp::Kind::kFloorF:

   case TensorExp::Kind::kSqrtF:

   case TensorExp::Kind::kSqrtC:

   case TensorExp::Kind::kExpm1F:

   case TensorExp::Kind::kExpm1C:

   case TensorExp::Kind::kLog1pF:

   case TensorExp::Kind::kLog1pC:

   case TensorExp::Kind::kRelu:

   case TensorExp::Kind::kSinF:

   case TensorExp::Kind::kSinC:

   case TensorExp::Kind::kTanhF:

   case TensorExp::Kind::kTanhC:

   case TensorExp::Kind::kNegF:

   case TensorExp::Kind::kNegC:

   case TensorExp::Kind::kNegI:

   case TensorExp::Kind::kTruncF:

   case TensorExp::Kind::kExtF:

   case TensorExp::Kind::kCastFS:

   case TensorExp::Kind::kCastFU:

   case TensorExp::Kind::kCastSF:

   case TensorExp::Kind::kCastUF:

   case TensorExp::Kind::kCastS:

   case TensorExp::Kind::kCastU:

   case TensorExp::Kind::kCastIdx:

   case TensorExp::Kind::kTruncI:

   case TensorExp::Kind::kCIm:

   case TensorExp::Kind::kCRe:

   case TensorExp::Kind::kBitCast:

     // A zero preserving operation (viz. f(0) = 0, [Bik96,Ch5]) maps the

     // lattice set of the operand through the operator into a new set.

     //

     //  -y|!y | y |

     //  --+---+---+

     //    | 0 |-y |

     {

       const ExprId e0 = expr.children.e0;

       const Value v = expr.val;

       Attribute a = expr.attr;

       return mapSet(kind, buildLattices(e0, i), v, nullptr, a);

     }

   case TensorExp::Kind::kBinaryBranch:

   case TensorExp::Kind::kSelect:

     // The left or right half of a binary operation which has already

     // been split into separate operations for each region.

     {

       const ExprId e0 = expr.children.e0;

       Operation *const op = expr.op;

       return mapSet(kind, buildLattices(e0, i), Value(), op);

     }

   case TensorExp::Kind::kUnary:

     // A custom unary operation.

     //

     //  op y|    !y    |     y      |

     //  ----+----------+------------+

     //      | absent() | present(y) |

     {

       const ExprId e0 = expr.children.e0;

       UnaryOp unop = cast<UnaryOp>(expr.op);

       const LatSetId child0 = buildLattices(e0, i);

       Region &absentRegion = unop.getAbsentRegion();

       if (absentRegion.empty()) {

         // Simple mapping over existing values.

         return mapSet(kind, child0, Value(), unop);

       }

       // Use a disjunction with `unop` on the left and the absent value as an

       // invariant on the right.

       Block &absentBlock = absentRegion.front();

       YieldOp absentYield = cast<YieldOp>(absentBlock.getTerminator());

       const Value absentVal = absentYield.getSingleResult();

       const ExprId rhs = addInvariantExp(absentVal);

       return disjSet(e, child0, buildLattices(rhs, i), unop);

     }

   // Binary operations.

   case TensorExp::Kind::kMulF:

   case TensorExp::Kind::kMulC:

   case TensorExp::Kind::kMulI:

   case TensorExp::Kind::kAndI:

     // A multiplicative operation only needs to be performed

     // for the conjunction of sparse iteration spaces.

     //

     //  x*y|!y | y |

     //  ---+---+---+

     //  !x | 0 | 0 |

     //   x | 0 |x*y|

     //

     // Note even here, 0*NaN=NaN and 0*Inf=NaN, but that is ignored.

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       return conjSet(e, buildLattices(e0, i), buildLattices(e1, i));

     }

   case TensorExp::Kind::kDivF:

   case TensorExp::Kind::kDivC:

   case TensorExp::Kind::kDivS:

   case TensorExp::Kind::kDivU:

     // A division is tricky, since 0/0, 0/c, c/0 all have

     // specific outcomes for floating-point and integers.

     // Thus, we need to traverse the full iteration space.

     //

     //  x/y|!y | y |

     //  ---+---+---+

     //  !x |0/0|0/y|   FP: 0/0=NaN,c/0=Inf,0/c=0 with c true nonzero

     //   x |x/0|x/y|  INT: x/0=exception for any x

     //

     // TODO: for now we "fixed" this by only accepting x/c cases

     //       during expression building, so that the conjunction

     //       rules applies (viz. x/c = x*(1/c) as far as lattice

     //       construction is concerned).

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       assert(!maybeZero(e1));

       return conjSet(e, buildLattices(e0, i), buildLattices(e1, i));

     }

   case TensorExp::Kind::kAddF:

   case TensorExp::Kind::kAddC:

   case TensorExp::Kind::kAddI:

   case TensorExp::Kind::kSubF:

   case TensorExp::Kind::kSubC:

   case TensorExp::Kind::kSubI:

   case TensorExp::Kind::kOrI:

   case TensorExp::Kind::kXorI:

     // An additive operation needs to be performed

     // for the disjunction of sparse iteration spaces.

     //

     //  x+y|!y | y |    x-y|!y | y |

     //  ---+---+---+    ---+---+---+

     //  !x | 0 | y |    !x | 0 |-y |

     //   x | x |x+y|     x | x |x-y|

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       return disjSet(e, buildLattices(e0, i), buildLattices(e1, i));

     }

   case TensorExp::Kind::kCmpF:

   case TensorExp::Kind::kCmpI:

     // A comparison operation needs to be performed

     // for the disjunction of sparse iteration spaces.

     //

     //   x < y |  !y   |   y   |

     //  -------+-------+-------+

     //     !x  |   0   | 0 < y |

     //      x  | x < 0 | x < y |

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       return disjSetWithZero(e, buildLattices(e0, i), buildLattices(e1, i));

     }

   case TensorExp::Kind::kShrS:

   case TensorExp::Kind::kShrU:

   case TensorExp::Kind::kShlI:

     // A shift operation by an invariant amount (viz. tensor expressions

     // can only occur at the left-hand-side of the operator) can be handled

     // with the conjunction rule.

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       assert(isInvariant(e1));

       return conjSet(e, buildLattices(e0, i), buildLattices(e1, i));

     }

   case TensorExp::Kind::kBinary:

     // A custom binary operation.

     //

     //  x op y|   !y    |       y      |

     //  ------+---------+--------------+

     //    !x  |  empty  |   right(y)   |

     //     x  | left(x) | overlap(x,y) |

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       BinaryOp binop = cast<BinaryOp>(expr.op);

       const LatSetId child0 = buildLattices(e0, i);

       const LatSetId child1 = buildLattices(e1, i);

       Region &leftRegion = binop.getLeftRegion();

       Region &rightRegion = binop.getRightRegion();

       // Left Region.

       Operation *leftYield = nullptr;

       if (!leftRegion.empty()) {

         Block &leftBlock = leftRegion.front();

         leftYield = leftBlock.getTerminator();

       }

       // Right Region.

       Operation *rightYield = nullptr;

       if (!rightRegion.empty()) {

         Block &rightBlock = rightRegion.front();

         rightYield = rightBlock.getTerminator();

       }

       bool includeLeft = binop.getLeftIdentity() || !leftRegion.empty();

       bool includeRight = binop.getRightIdentity() || !rightRegion.empty();

       return combiSet(e, child0, child1, binop, includeLeft,

                       TensorExp::Kind::kBinaryBranch, leftYield, includeRight,

                       TensorExp::Kind::kBinaryBranch, rightYield);

     }

   case TensorExp::Kind::kReduce:

     // A custom reduce operation.

     {

       const ExprId e0 = expr.children.e0;

       const ExprId e1 = expr.children.e1;

       Operation *const op = expr.op;

       return conjSet(e, buildLattices(e0, i), buildLattices(e1, i), op);

     }

   case TensorExp::Kind::kDenseOp: {

     // It does not really matter whether we use conjunctive/disjunctive set

     // here, as all the operands of kDenseOp must be dense, the disjunctive set

     // will be optimized into conjunctive set eventually.

     if (expr.children.e1 == detail::kInvalidId) {

       const ExprId e0 = expr.children.e0;

       Operation *const op = expr.op;

       return mapSet(kind, buildLattices(e0, i), Value(), op);

     }


     const ExprId e0 = expr.children.e0;

     const ExprId e1 = expr.children.e1;

     Operation *const op = expr.op;

     return conjSet(e, buildLattices(e0, i), buildLattices(e1, i), op);

   }

   }

   llvm_unreachable("unexpected expression kind");

 }


 std::optional<ExprId> Merger::buildTensorExpFromLinalg(linalg::GenericOp op) {

   // Build the linalg semantics backward from yield.

   Operation *yield = op.getRegion().front().getTerminator();

   assert(isa<linalg::YieldOp>(yield));

   return buildTensorExp(op, yield->getOperand(0)).first;

 }


 /// Only returns true if we are certain this is a zero.

 static bool isCertainZero(Value val) {

   if (auto c = val.getDefiningOp<complex::ConstantOp>()) {

     ArrayAttr arrayAttr = c.getValue();

     return cast<FloatAttr>(arrayAttr[0]).getValue().isZero() &&

            cast<FloatAttr>(arrayAttr[1]).getValue().isZero();

   }

   if (auto c = val.getDefiningOp<arith::ConstantIntOp>())

     return c.value() == 0;

   if (auto c = val.getDefiningOp<arith::ConstantFloatOp>())

     return c.value().isZero();

   return false;

 }


 /// Only returns false if we are certain this is a nonzero.

 bool Merger::maybeZero(ExprId e) const {

   const auto &expr = exp(e);

   if (expr.kind == TensorExp::Kind::kInvariant) {

     // Note that this is different from isCertainZero() in a subtle

     // way by always returning true for non-constants.

     if (auto c = expr.val.getDefiningOp<complex::ConstantOp>()) {

       ArrayAttr arrayAttr = c.getValue();

       return cast<FloatAttr>(arrayAttr[0]).getValue().isZero() &&

              cast<FloatAttr>(arrayAttr[1]).getValue().isZero();

     }

     if (auto c = expr.val.getDefiningOp<arith::ConstantIntOp>())

       return c.value() == 0;

     if (auto c = expr.val.getDefiningOp<arith::ConstantFloatOp>())

       return c.value().isZero();

   }

   return true;

 }


 Type Merger::inferType(ExprId e, Value src) const {

   // Obtain the destination type from the cast node.

   Type dtp = exp(e).val.getType();

   // Inspect source type. For vector types, apply the same

   // vectorization to the destination type.

   if (auto vtp = dyn_cast<VectorType>(src.getType()))

     return VectorType::get(vtp.getNumElements(), dtp, vtp.getScalableDims());

   return dtp;

 }


 /// Ensures that the sparsifier can generate code for expression.

 static bool isAdmissibleBranchExp(Operation *op, Block *block, Value v) {

   // Arguments are always admissible.

   if (isa<BlockArgument>(v))

     return true;

   // Accept index anywhere.

   Operation *def = v.getDefiningOp();

   if (isa<linalg::IndexOp>(def))

     return true;

   // Operation defined outside branch.

   if (def->getBlock() != block)

     return def->getBlock() != op->getBlock(); // invariant?

   // Operation defined within branch. Anything is accepted,

   // as long as all subexpressions are admissible.

   for (unsigned i = 0, n = def->getNumOperands(); i < n; i++)

     if (!isAdmissibleBranchExp(op, block, def->getOperand(i)))

       return false;

   return true;

 }


 /// Ensures that the sparsifier can generate code for branch.

 static bool isAdmissibleBranch(Operation *op, Region &region) {

   if (region.empty())

     return true;

   // Build the semi-ring branch semantics backward from yield.

   Operation *yield = region.front().getTerminator();

   assert(isa<YieldOp>(yield));

   return isAdmissibleBranchExp(op, &region.front(), yield->getOperand(0));

 }


 // Recognizes a direct GT comparison.

 static bool isGreater(TensorExp::Kind kind, Attribute attr) {

   if (kind == TensorExp::Kind::kCmpI) {

     auto pred = llvm::cast<arith::CmpIPredicateAttr>(attr).getValue();

     return pred == arith::CmpIPredicate::ugt ||

            pred == arith::CmpIPredicate::sgt;

   }

   if (kind == TensorExp::Kind::kCmpF) {

     auto pred = llvm::cast<arith::CmpFPredicateAttr>(attr).getValue();

     return pred == arith::CmpFPredicate::UGT ||

            pred == arith::CmpFPredicate::OGT;

   }

   return false;

 }


 std::pair<std::optional<ExprId>, bool>

 Merger::buildTensorExp(linalg::GenericOp op, Value v) {

   // Recursion leaves.

   if (auto arg = dyn_cast<BlockArgument>(v)) {

     const TensorId tid = makeTensorId(arg.getArgNumber());

     // Any argument of the generic op that is not marked as a scalar

     // argument is considered a tensor, indexed by the implicit loop

     // bounds. This includes rank-0 tensor arguments.

     if (arg.getOwner()->getParentOp() == op) {

       OpOperand &t = op->getOpOperand(tid);

       bool hasSpDep = getSparseTensorEncoding(t.get().getType()) != nullptr;

       if (!op.isScalar(&t))

         return {addTensorExp(tid), hasSpDep};

       v = t.get(); // get scalar value

     }

     // Any other argument (marked as scalar argument for the generic op

     // or belonging to an enveloping op) is considered invariant.

     return {addInvariantExp(v), /*hasSpDep=*/false};

   }


   // Something defined outside is invariant.

   Operation *def = v.getDefiningOp();

   if (def->getBlock() != &op.getRegion().front())

     return {addInvariantExp(v), /*hasSpDep=*/false};

   // Construct index operations.

   if (def->getNumOperands() == 0) {

     if (auto indexOp = dyn_cast<linalg::IndexOp>(def))

       return {addLoopVarExp(makeLoopId(indexOp.getDim())), /*hasSpDep=*/false};

   }


   // Construct unary operations if subexpression can be built.

   if (def->getNumOperands() == 1) {

     const auto [x, hasSpDep] = buildTensorExp(op, def->getOperand(0));

     if (x.has_value()) {

       const ExprId e = *x;

       if (isa<math::AbsFOp>(def))

         return {addExp(TensorExp::Kind::kAbsF, e), hasSpDep};

       if (isa<complex::AbsOp>(def))

         return {addExp(TensorExp::Kind::kAbsC, e), hasSpDep};

       if (isa<math::AbsIOp>(def))

         return {addExp(TensorExp::Kind::kAbsI, e), hasSpDep};

       if (isa<math::CeilOp>(def))

         return {addExp(TensorExp::Kind::kCeilF, e), hasSpDep};

       if (isa<math::FloorOp>(def))

         return {addExp(TensorExp::Kind::kFloorF, e), hasSpDep};

       if (isa<math::SqrtOp>(def))

         return {addExp(TensorExp::Kind::kSqrtF, e), hasSpDep};

       if (isa<complex::SqrtOp>(def))

         return {addExp(TensorExp::Kind::kSqrtC, e), hasSpDep};

       if (isa<math::ExpM1Op>(def))

         return {addExp(TensorExp::Kind::kExpm1F, e), hasSpDep};

       if (isa<complex::Expm1Op>(def))

         return {addExp(TensorExp::Kind::kExpm1C, e), hasSpDep};

       if (isa<math::Log1pOp>(def))

         return {addExp(TensorExp::Kind::kLog1pF, e), hasSpDep};

       if (isa<complex::Log1pOp>(def))

         return {addExp(TensorExp::Kind::kLog1pC, e), hasSpDep};

       if (isa<math::SinOp>(def))

         return {addExp(TensorExp::Kind::kSinF, e), hasSpDep};

       if (isa<complex::SinOp>(def))

         return {addExp(TensorExp::Kind::kSinC, e), hasSpDep};

       if (isa<math::TanhOp>(def))

         return {addExp(TensorExp::Kind::kTanhF, e), hasSpDep};

       if (isa<complex::TanhOp>(def))

         return {addExp(TensorExp::Kind::kTanhC, e), hasSpDep};

       if (isa<arith::NegFOp>(def))

         return {addExp(TensorExp::Kind::kNegF, e), hasSpDep}; // no negi in std

       if (isa<complex::NegOp>(def))

         return {addExp(TensorExp::Kind::kNegC, e), hasSpDep};

       if (isa<arith::TruncFOp>(def))

         return {addExp(TensorExp::Kind::kTruncF, e, v), hasSpDep};

       if (isa<arith::ExtFOp>(def))

         return {addExp(TensorExp::Kind::kExtF, e, v), hasSpDep};

       if (isa<arith::FPToSIOp>(def))

         return {addExp(TensorExp::Kind::kCastFS, e, v), hasSpDep};

       if (isa<arith::FPToUIOp>(def))

         return {addExp(TensorExp::Kind::kCastFU, e, v), hasSpDep};

       if (isa<arith::SIToFPOp>(def))

         return {addExp(TensorExp::Kind::kCastSF, e, v), hasSpDep};

       if (isa<arith::UIToFPOp>(def))

         return {addExp(TensorExp::Kind::kCastUF, e, v), hasSpDep};

       if (isa<arith::ExtSIOp>(def))

         return {addExp(TensorExp::Kind::kCastS, e, v), hasSpDep};

       if (isa<arith::ExtUIOp>(def))

         return {addExp(TensorExp::Kind::kCastU, e, v), hasSpDep};

       if (isa<arith::IndexCastOp>(def))

         return {addExp(TensorExp::Kind::kCastIdx, e, v), hasSpDep};

       if (isa<arith::TruncIOp>(def))

         return {addExp(TensorExp::Kind::kTruncI, e, v), hasSpDep};

       if (isa<complex::ImOp>(def))

         return {addExp(TensorExp::Kind::kCIm, e), hasSpDep};

       if (isa<complex::ReOp>(def))

         return {addExp(TensorExp::Kind::kCRe, e), hasSpDep};

       if (isa<arith::BitcastOp>(def))

         return {addExp(TensorExp::Kind::kBitCast, e, v), hasSpDep};

       if (auto unop = dyn_cast<sparse_tensor::UnaryOp>(def)) {

         if (isAdmissibleBranch(unop, unop.getPresentRegion()) &&

             isAdmissibleBranch(unop, unop.getAbsentRegion()))

           return {addExp(TensorExp::Kind::kUnary, e, Value(), def), hasSpDep};

       }

       if (auto selop = dyn_cast<sparse_tensor::SelectOp>(def)) {

         if (isAdmissibleBranch(selop, selop.getRegion()))

           return {addExp(TensorExp::Kind::kSelect, e, Value(), def), hasSpDep};

       }

     }

   }


   // Construct binary operations if subexpressions can be built.

   // See buildLattices() for an explanation of rejecting certain

   // division and shift operations.

   if (def->getNumOperands() == 2) {

     const auto [x, xSpVals] = buildTensorExp(op, def->getOperand(0));

     const auto [y, ySpVals] = buildTensorExp(op, def->getOperand(1));

     // For a conjunctive operation, it yields a "sparse" result if any operand

     // is sparse. For a disjunctive operation, it yields a "sparse" result if

     // all operands are sparse.

     bool conjSpVals = xSpVals || ySpVals;

     bool disjSpVals = xSpVals && ySpVals;

     if (x.has_value() && y.has_value()) {

       const ExprId e0 = *x;

       const ExprId e1 = *y;

       if (isa<arith::MulFOp>(def))

         return {addExp(TensorExp::Kind::kMulF, e0, e1), conjSpVals};

       if (isa<complex::MulOp>(def))

         return {addExp(TensorExp::Kind::kMulC, e0, e1), conjSpVals};

       if (isa<arith::MulIOp>(def))

         return {addExp(TensorExp::Kind::kMulI, e0, e1), conjSpVals};

       if (isa<arith::DivFOp>(def) && !maybeZero(e1))

         return {addExp(TensorExp::Kind::kDivF, e0, e1), conjSpVals};

       if (isa<complex::DivOp>(def) && !maybeZero(e1))

         return {addExp(TensorExp::Kind::kDivC, e0, e1), conjSpVals};

       if (isa<arith::DivSIOp>(def) && !maybeZero(e1))

         return {addExp(TensorExp::Kind::kDivS, e0, e1), conjSpVals};

       if (isa<arith::DivUIOp>(def) && !maybeZero(e1))

         return {addExp(TensorExp::Kind::kDivU, e0, e1), conjSpVals};

       if (isa<arith::AddFOp>(def))

         return {addExp(TensorExp::Kind::kAddF, e0, e1), disjSpVals};

       if (isa<complex::AddOp>(def))

         return {addExp(TensorExp::Kind::kAddC, e0, e1), disjSpVals};

       if (isa<arith::AddIOp>(def))

         return {addExp(TensorExp::Kind::kAddI, e0, e1), disjSpVals};

       if (isa<arith::SubFOp>(def))

         return {addExp(TensorExp::Kind::kSubF, e0, e1), disjSpVals};

       if (isa<complex::SubOp>(def))

         return {addExp(TensorExp::Kind::kSubC, e0, e1), disjSpVals};

       if (isa<arith::SubIOp>(def))

         return {addExp(TensorExp::Kind::kSubI, e0, e1), disjSpVals};

       if (isa<arith::AndIOp>(def))

         return {addExp(TensorExp::Kind::kAndI, e0, e1), conjSpVals};

       if (isa<arith::OrIOp>(def))

         return {addExp(TensorExp::Kind::kOrI, e0, e1), disjSpVals};

       if (isa<arith::XOrIOp>(def))

         return {addExp(TensorExp::Kind::kXorI, e0, e1), disjSpVals};

       if (isa<arith::ShRSIOp>(def) && isInvariant(e1))

         return {addExp(TensorExp::Kind::kShrS, e0, e1), conjSpVals};

       if (isa<arith::ShRUIOp>(def) && isInvariant(e1))

         return {addExp(TensorExp::Kind::kShrU, e0, e1), conjSpVals};

       if (isa<arith::ShLIOp>(def) && isInvariant(e1))

         return {addExp(TensorExp::Kind::kShlI, e0, e1), conjSpVals};

       if (auto ci = dyn_cast<arith::CmpIOp>(def)) {

         if (ci.getPredicate() == arith::CmpIPredicate::eq &&

             ci.getPredicate() == arith::CmpIPredicate::sle &&

             ci.getPredicate() == arith::CmpIPredicate::sge &&

             ci.getPredicate() == arith::CmpIPredicate::ule &&

             ci.getPredicate() == arith::CmpIPredicate::uge) {

           // We can not sparsify comparison with equal, this is because 0 <= 0

           // yields true, and thus densifies the result.

           return {std::nullopt, false};

         }


         auto e = addExp(TensorExp::Kind::kCmpI, e0, e1, nullptr,

                         ci.getPredicateAttr());

         return {e, conjSpVals};

       }

       if (auto cf = dyn_cast<arith::CmpFOp>(def)) {

         if (cf.getPredicate() == arith::CmpFPredicate::OEQ &&

             cf.getPredicate() == arith::CmpFPredicate::OGE &&

             cf.getPredicate() == arith::CmpFPredicate::OLE &&

             cf.getPredicate() == arith::CmpFPredicate::ONE &&

             cf.getPredicate() == arith::CmpFPredicate::UEQ &&

             cf.getPredicate() == arith::CmpFPredicate::UGE &&

             cf.getPredicate() == arith::CmpFPredicate::ULE &&

             cf.getPredicate() == arith::CmpFPredicate::ORD &&

             cf.getPredicate() == arith::CmpFPredicate::UNO) {

           // We can not sparsify comparison with equal, this is because 0 <= 0

           // yields true, and thus densifies the result.

           return {std::nullopt, false};

         }

         auto e = addExp(TensorExp::Kind::kCmpF, e0, e1, nullptr,

                         cf.getPredicateAttr());

         return {e, conjSpVals};

       }

       if (auto binop = dyn_cast<sparse_tensor::BinaryOp>(def)) {

         if (isAdmissibleBranch(binop, binop.getOverlapRegion()) &&

             (binop.getLeftIdentity() ||

              isAdmissibleBranch(binop, binop.getLeftRegion())) &&

             (binop.getRightIdentity() ||

              isAdmissibleBranch(binop, binop.getRightRegion())))

           return {addExp(TensorExp::Kind::kBinary, e0, e1, def), conjSpVals};

       }

     }

   }


   // Construct ternary operations if subexpressions can be built.

   if (def->getNumOperands() == 3) {

     const auto [x, xDepSp] = buildTensorExp(op, def->getOperand(0));

     const auto [y, yDepSp] = buildTensorExp(op, def->getOperand(1));

     const auto [z, zDepSp] = buildTensorExp(op, def->getOperand(2));

     bool hasSpDep = xDepSp || yDepSp || zDepSp;

     if (x.has_value() && y.has_value() && z.has_value()) {

       const ExprId e0 = *x;

       const ExprId e1 = *y;

       if (auto redop = dyn_cast<sparse_tensor::ReduceOp>(def)) {

         if (isAdmissibleBranch(redop, redop.getRegion()))

           return {addExp(TensorExp::Kind::kReduce, e0, e1, def), hasSpDep};

       }

       if (auto selop = dyn_cast<arith::SelectOp>(def)) {

         // Recognize an integral or floating-point ReLu(x) = Max(x, 0)

         // operation inside a very specific ternary select operation.

         // TODO: capture MIN/MAX/ABS/RELU structure in a more generic way

         const auto &cnd = exp(*x);

         if (isGreater(cnd.kind, cnd.attr) &&

             exp(*y).kind == TensorExp::Kind::kTensor &&

             exp(*z).kind == TensorExp::Kind::kInvariant &&

             isCertainZero(exp(*z).val)) {

           const auto &a = exp(cnd.children.e0);

           const auto &b = exp(cnd.children.e1);

           if (a.kind == TensorExp::Kind::kTensor &&

               a.tensor == exp(*y).tensor &&

               b.kind == TensorExp::Kind::kInvariant && isCertainZero(b.val)) {

             return {addExp(TensorExp::Kind::kRelu, *y, detail::kInvalidId,

                            nullptr, cnd.attr),

                     yDepSp};

           }

         }

       }

     }

   }


   // If we reach here, we are dealing with an operation that is not currently

   // sparsifiable. We can still generate code for it if all its operands only

   // have dense dependencies (i.e., all the values are loaded from dense

   // tensors).

   if (def->getNumResults() != 1) // only handle single result operation.

     return {std::nullopt, false};

   SmallVector<std::pair<std::optional<ExprId>, bool>, 2> subExp;

   // Builds all the sub-expressions

   for (Value operand : def->getOperands())

     subExp.push_back(buildTensorExp(op, operand));


   if (llvm::all_of(subExp,

                    [](auto e) { return e.first.has_value() && !e.second; })) {

     // All the subexpressions can be built and has *no* sparse dependencies.

     if (subExp.size() == 2) {

       auto e = addExp(TensorExp::Kind::kDenseOp, *subExp[0].first,

                       *subExp[1].first, def);

       return {e, false};

     }

     if (subExp.size() == 1) {

       auto e = addExp(TensorExp::Kind::kDenseOp, *subExp[0].first,

                       detail::kInvalidId, def);

       return {e, false};

     }

   }


   // Cannot build.

   return {std::nullopt, false};

 }


 static Value insertYieldOp(RewriterBase &rewriter, Location loc, Region &region,

                            ValueRange vals) {

   // Make a clone of overlap region.

   Region tmpRegion;

   IRMapping mapper;

   region.cloneInto(&tmpRegion, tmpRegion.begin(), mapper);

   Block &clonedBlock = tmpRegion.front();

   YieldOp clonedYield = cast<YieldOp>(clonedBlock.getTerminator());

   // Merge cloned block and return yield value.

   Operation *placeholder = arith::ConstantIndexOp::create(rewriter, loc, 0);

   rewriter.inlineBlockBefore(&tmpRegion.front(), placeholder, vals);

   Value val = clonedYield.getSingleResult();

   rewriter.eraseOp(clonedYield);

   rewriter.eraseOp(placeholder);

   return val;

 }


 static Value buildUnaryPresent(RewriterBase &rewriter, Location loc,

                                Operation *op, Value v0) {

   if (!v0)

     // Empty input value must be propagated.

     return Value();

   UnaryOp unop = cast<UnaryOp>(op);

   Region &presentRegion = unop.getPresentRegion();

   if (presentRegion.empty())

     // Uninitialized Value() will be interpreted as missing data in the

     // output.

     return Value();

   return insertYieldOp(rewriter, loc, presentRegion, {v0});

 }


 static Value buildBinaryOverlap(RewriterBase &rewriter, Location loc,

                                 Operation *op, Value v0, Value v1) {

   if (!v0 || !v1)

     // Empty input values must be propagated.

     return Value();

   BinaryOp binop = cast<BinaryOp>(op);

   Region &overlapRegion = binop.getOverlapRegion();

   if (overlapRegion.empty())

     // Uninitialized Value() will be interpreted as missing data in the

     // output.

     return Value();

   return insertYieldOp(rewriter, loc, overlapRegion, {v0, v1});

 }


 static Value buildRelu(RewriterBase &rewriter, Location loc, Value v0,

                        Attribute attr) {

   Type tp = v0.getType();

   auto zero =

       arith::ConstantOp::create(rewriter, loc, tp, rewriter.getZeroAttr(tp));

   Value cmp;

   if (isa<FloatType>(tp)) {

     auto pred = llvm::cast<arith::CmpFPredicateAttr>(attr);

     cmp = arith::CmpFOp::create(rewriter, loc, pred, v0, zero);

   } else {

     auto pred = llvm::cast<arith::CmpIPredicateAttr>(attr);

     cmp = arith::CmpIOp::create(rewriter, loc, pred, v0, zero);

   }

   return arith::SelectOp::create(rewriter, loc, cmp, v0, zero);

 }


 Value Merger::buildExp(RewriterBase &rewriter, Location loc, ExprId e, Value v0,

                        Value v1) const {

   const auto &expr = exp(e);

   switch (expr.kind) {

   // Leaf.

   case TensorExp::Kind::kTensor:

   case TensorExp::Kind::kInvariant:

   case TensorExp::Kind::kLoopVar:

   case TensorExp::Kind::kSynZero:

     llvm_unreachable("unexpected non-op");

   // Unary operations.

   case TensorExp::Kind::kAbsF:

     return math::AbsFOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kAbsC: {

     auto type = cast<ComplexType>(v0.getType());

     auto eltType = cast<FloatType>(type.getElementType());

     return complex::AbsOp::create(rewriter, loc, eltType, v0);

   }

   case TensorExp::Kind::kAbsI:

     return math::AbsIOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kCeilF:

     return math::CeilOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kFloorF:

     return math::FloorOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kSqrtF:

     return math::SqrtOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kSqrtC:

     return complex::SqrtOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kExpm1F:

     return math::ExpM1Op::create(rewriter, loc, v0);

   case TensorExp::Kind::kExpm1C:

     return complex::Expm1Op::create(rewriter, loc, v0);

   case TensorExp::Kind::kLog1pF:

     return math::Log1pOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kLog1pC:

     return complex::Log1pOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kRelu:

     return buildRelu(rewriter, loc, v0, expr.attr);

   case TensorExp::Kind::kSinF:

     return math::SinOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kSinC:

     return complex::SinOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kTanhF:

     return math::TanhOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kTanhC:

     return complex::TanhOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kNegF:

     return arith::NegFOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kNegC:

     return complex::NegOp::create(rewriter, loc, v0);

   case TensorExp::Kind::kNegI: // no negi in std

     return arith::SubIOp::create(

         rewriter, loc,

         arith::ConstantOp::create(rewriter, loc, v0.getType(),

                                   rewriter.getZeroAttr(v0.getType())),

         v0);

   case TensorExp::Kind::kTruncF:

     return arith::TruncFOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kExtF:

     return arith::ExtFOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastFS:

     return arith::FPToSIOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastFU:

     return arith::FPToUIOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastSF:

     return arith::SIToFPOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastUF:

     return arith::UIToFPOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastS:

     return arith::ExtSIOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastU:

     return arith::ExtUIOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCastIdx:

     return arith::IndexCastOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kTruncI:

     return arith::TruncIOp::create(rewriter, loc, inferType(e, v0), v0);

   case TensorExp::Kind::kCIm: {

     auto type = cast<ComplexType>(v0.getType());

     auto eltType = cast<FloatType>(type.getElementType());

     return complex::ImOp::create(rewriter, loc, eltType, v0);

   }

   case TensorExp::Kind::kCRe: {

     auto type = cast<ComplexType>(v0.getType());

     auto eltType = cast<FloatType>(type.getElementType());

     return complex::ReOp::create(rewriter, loc, eltType, v0);

   }

   case TensorExp::Kind::kBitCast:

     return arith::BitcastOp::create(rewriter, loc, inferType(e, v0), v0);

   // Binary operations.

   case TensorExp::Kind::kMulF:

     return arith::MulFOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kMulC:

     return complex::MulOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kMulI:

     return arith::MulIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kDivF:

     return arith::DivFOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kDivC:

     return complex::DivOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kDivS:

     return arith::DivSIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kDivU:

     return arith::DivUIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kAddF:

     return arith::AddFOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kAddC:

     return complex::AddOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kAddI:

     return arith::AddIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kSubF:

     return arith::SubFOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kSubC:

     return complex::SubOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kSubI:

     return arith::SubIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kAndI:

     return arith::AndIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kOrI:

     return arith::OrIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kXorI:

     return arith::XOrIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kShrS:

     return arith::ShRSIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kShrU:

     return arith::ShRUIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kShlI:

     return arith::ShLIOp::create(rewriter, loc, v0, v1);

   case TensorExp::Kind::kCmpI: {

     auto predicate = llvm::cast<arith::CmpIPredicateAttr>(expr.attr);

     return arith::CmpIOp::create(rewriter, loc, predicate, v0, v1);

   }

   case TensorExp::Kind::kCmpF: {

     auto predicate = llvm::cast<arith::CmpFPredicateAttr>(expr.attr);

     return arith::CmpFOp::create(rewriter, loc, predicate, v0, v1);

   }

   case TensorExp::Kind::kBinaryBranch: // semi-ring ops with custom logic.

     return insertYieldOp(rewriter, loc, *expr.op->getBlock()->getParent(),

                          {v0});

   case TensorExp::Kind::kUnary:

     return buildUnaryPresent(rewriter, loc, expr.op, v0);

   case TensorExp::Kind::kSelect:

     return insertYieldOp(rewriter, loc,

                          cast<sparse_tensor::SelectOp>(expr.op).getRegion(),

                          {v0});

   case TensorExp::Kind::kBinary:

     return buildBinaryOverlap(rewriter, loc, expr.op, v0, v1);

   case TensorExp::Kind::kReduce: {

     ReduceOp redOp = cast<ReduceOp>(expr.op);

     return insertYieldOp(rewriter, loc, redOp.getRegion(), {v0, v1});

   }

   case TensorExp::Kind::kDenseOp: {

     Operation *actualOp = expr.op;

     IRMapping mapping;

     mapping.map(actualOp->getOperand(0), v0);

     if (actualOp->getNumOperands() == 2)

       mapping.map(actualOp->getOperand(1), v1);

     return rewriter.clone(*actualOp, mapping)->getResult(0);

   }

   }

   llvm_unreachable("unexpected expression kind in build");

 }


 } // namespace sparse_tensor

 } // namespace mlir

Complex.h

Operation.h

kind
union mlir::linalg::@1252::ArityGroupAndKind::Kind kind

Merger.h

mlir::Attribute
Attributes are known-constant values of operations.
Definition: Attributes.h:25

mlir::Block
Block represents an ordered list of Operations.
Definition: Block.h:33

mlir::Block::getTerminator
Operation * getTerminator()
Get the terminator operation of this block.
Definition: Block.cpp:244

mlir::Builder::getZeroAttr
TypedAttr getZeroAttr(Type type)
Definition: Builders.cpp:324

mlir::IRMapping
This is a utility class for mapping one set of IR entities to another.
Definition: IRMapping.h:26

mlir::IRMapping::map
void map(Value from, Value to)
Inserts a new mapping for 'from' to 'to'.
Definition: IRMapping.h:30

mlir::IROperand::get
IRValueT get() const
Return the current value being used by this operand.
Definition: UseDefLists.h:160

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:76

mlir::OpBuilder::clone
Operation * clone(Operation &op, IRMapping &mapper)
Creates a deep copy of the specified operation, remapping any operands that use values outside of the...
Definition: Builders.cpp:562

mlir::OpOperand
This class represents an operand of an operation.
Definition: Value.h:257

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::Operation::getOperand
Value getOperand(unsigned idx)
Definition: Operation.h:350

mlir::Operation::getResult
OpResult getResult(unsigned idx)
Get the 'idx'th result of this operation.
Definition: Operation.h:407

mlir::Operation::getNumOperands
unsigned getNumOperands()
Definition: Operation.h:346

mlir::Operation::getBlock
Block * getBlock()
Returns the operation block that contains this operation.
Definition: Operation.h:213

mlir::Operation::getRegion
Region & getRegion(unsigned index)
Returns the region held by this operation at position 'index'.
Definition: Operation.h:686

mlir::Region
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition: Region.h:26

mlir::Region::empty
bool empty()
Definition: Region.h:60

mlir::Region::cloneInto
void cloneInto(Region *dest, IRMapping &mapper)
Clone the internal blocks from this region into dest.
Definition: Region.cpp:70

mlir::Region::begin
iterator begin()
Definition: Region.h:55

mlir::Region::front
Block & front()
Definition: Region.h:65

mlir::RewriterBase
This class coordinates the application of a rewrite on a set of IR, providing a way for clients to tr...
Definition: PatternMatch.h:368

mlir::RewriterBase::eraseOp
virtual void eraseOp(Operation *op)
This method erases an operation that is known to have no uses.
Definition: PatternMatch.cpp:155

mlir::RewriterBase::inlineBlockBefore
virtual void inlineBlockBefore(Block *source, Block *dest, Block::iterator before, ValueRange argValues={})
Inline the operations of block 'source' into block 'dest' before the given position.
Definition: PatternMatch.cpp:290

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition: Types.h:74

mlir::ValueRange
This class provides an abstraction over the different types of ranges over Values.
Definition: ValueRange.h:387

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:105

mlir::Value::getDefiningOp
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition: Value.cpp:18

mlir::arith::ConstantFloatOp
Specialization of arith.constant op that returns a floating point value.
Definition: Arith.h:92

mlir::arith::ConstantIndexOp::create
static ConstantIndexOp create(OpBuilder &builder, Location location, int64_t value)
Definition: ArithOps.cpp:359

mlir::arith::ConstantIntOp
Specialization of arith.constant op that returns an integer value.
Definition: Arith.h:54

mlir::sparse_tensor::Merger::conjLat
LatPointId conjLat(ExprId e, LatPointId p0, LatPointId p1, Operation *op=nullptr)
Computes a single conjunction of two lattice points by taking the "union" of LoopId (effectively cons...
Definition: Merger.cpp:315

mlir::sparse_tensor::Merger::disjSet
LatSetId disjSet(ExprId e, LatSetId s0, LatSetId s1, Operation *op=nullptr)
Disjunctive merge of two lattice sets: (s0 /\_op s1, s0, s1).
Definition: Merger.cpp:338

mlir::sparse_tensor::Merger::isSingleCondition
bool isSingleCondition(TensorId t, ExprId e) const
Returns true if given tensor iterates only in the given tensor expression.
Definition: Merger.cpp:577

mlir::sparse_tensor::Merger::hasSparseIdxReduction
bool hasSparseIdxReduction(const BitVector &bits) const
Returns true if bits contains a dependent index reduction condition on sparse levels.
Definition: Merger.cpp:680

mlir::sparse_tensor::Merger::expContainsTensor
bool expContainsTensor(ExprId e, TensorId t) const
Returns true if the expression contains the tensor as an operand.
Definition: Merger.cpp:522

mlir::sparse_tensor::Merger::mapBinWithSynZeroSet
LatSetId mapBinWithSynZeroSet(ExprId e, LatSetId s, bool lhsZero)
Maps the binary operator to the same operation but with one of its operand set to zero,...
Definition: Merger.cpp:414

mlir::sparse_tensor::Merger::isSparseLvlWithNonTrivialIdxExp
bool isSparseLvlWithNonTrivialIdxExp(TensorLoopId b) const
Checks whether the TensorLoopId represents a sparse tensor level contains non-trivial index expressio...
Definition: Merger.h:510

mlir::sparse_tensor::Merger::dumpBits
void dumpBits(const BitVector &bits) const
Definition: Merger.cpp:920

mlir::sparse_tensor::Merger::addSet
LatSetId addSet()
Constructs a new (initially empty) set, and returns its identifier.
Definition: Merger.cpp:309

mlir::sparse_tensor::Merger::simplifyCond
BitVector simplifyCond(LatSetId s, LatPointId p)
Simplifies the conditions in a conjunction of a given lattice point within the given set using just t...
Definition: Merger.cpp:461

mlir::sparse_tensor::Merger::hasNegateOnOut
bool hasNegateOnOut(ExprId e) const
Returns true if the expression contains a negation on output tensor.
Definition: Merger.cpp:544

mlir::sparse_tensor::Merger::isLvlWithNonTrivialIdxExp
bool isLvlWithNonTrivialIdxExp(TensorLoopId b) const
Checks whether the TensorLoopId represents a tensor level contains non-trivial index expression.
Definition: Merger.h:501

mlir::sparse_tensor::Merger::disjSetWithZero
LatSetId disjSetWithZero(ExprId e, LatSetId s0, LatSetId s1)
Disjunctive merge of two lattice sets and also set one of the operand to zero: (s0 /\_op s1 (e0 op e1...
Definition: Merger.cpp:356

mlir::sparse_tensor::Merger::dumpSet
void dumpSet(LatSetId s) const
Definition: Merger.cpp:910

mlir::sparse_tensor::Merger::dumpLat
void dumpLat(LatPointId p) const
Definition: Merger.cpp:899

mlir::sparse_tensor::Merger::combiSet
LatSetId combiSet(ExprId e, LatSetId s0, LatSetId s1, Operation *orig, bool includeLeft, TensorExp::Kind ltrans, Operation *opleft, bool includeRight, TensorExp::Kind rtrans, Operation *opright)
Disjunctive merge of two lattice sets with custom handling of the overlap, left, and right regions.
Definition: Merger.cpp:380

mlir::sparse_tensor::Merger::addTensorExp
ExprId addTensorExp(TensorId t)
Constructs a new tensor expression, and returns its identifier.
Definition: Merger.cpp:247

mlir::sparse_tensor::Merger::buildLattices
LatSetId buildLattices(ExprId e, LoopId i)
Builds the iteration lattices in a bottom-up traversal given the remaining tensor (sub)expression and...
Definition: Merger.cpp:940

mlir::sparse_tensor::Merger::conjSet
LatSetId conjSet(ExprId e, LatSetId s0, LatSetId s1, Operation *op=nullptr)
Conjunctive merge of two lattice sets: (s0 /\_op s1).
Definition: Merger.cpp:329

mlir::sparse_tensor::Merger::addExp
ExprId addExp(TensorExp::Kind k, ExprId e0, ExprId e1=detail::kInvalidId, Operation *op=nullptr, Attribute attr=nullptr)
Constructs a new unary or binary expression, and returns its identifier.
Definition: Merger.cpp:277

mlir::sparse_tensor::Merger::addSynZeroExp
ExprId addSynZeroExp()
Constructs a new synthetic zero expression.
Definition: Merger.cpp:270

mlir::sparse_tensor::Merger::makeLoopId
constexpr LoopId makeLoopId(unsigned i) const
Safely converts the argument to a loop identifier.
Definition: Merger.h:249

mlir::sparse_tensor::Merger::buildTensorExpFromLinalg
std::optional< ExprId > buildTensorExpFromLinalg(linalg::GenericOp op)
Builds a tensor expression from the given Linalg operation.
Definition: Merger.cpp:1193

mlir::sparse_tensor::Merger::mapSet
LatSetId mapSet(TensorExp::Kind kind, LatSetId s, Value v=Value(), Operation *op=nullptr, Attribute attr=nullptr)
Maps the unary operator over the lattice set of the operand, i.e.
Definition: Merger.cpp:401

mlir::sparse_tensor::Merger::set
ArrayRef< LatPointId > set(LatSetId s) const
Definition: Merger.h:549

mlir::sparse_tensor::Merger::optimizeSet
LatSetId optimizeSet(LatSetId s)
Optimizes the iteration lattice points in the given set.
Definition: Merger.cpp:431

mlir::sparse_tensor::Merger::tensor
constexpr TensorId tensor(TensorLoopId b) const
Gets the tensor-identifier of the TensorLoopId.
Definition: Merger.h:346

mlir::sparse_tensor::Merger::dumpExp
void dumpExp(ExprId e) const
Print methods (for debugging).
Definition: Merger.cpp:799

mlir::sparse_tensor::Merger::Merger
Merger(unsigned numInputOutputTensors, unsigned numLoops, unsigned maxLvlRank)
Constructs a merger for the given number of tensors and loops.
Definition: Merger.cpp:224

mlir::sparse_tensor::Merger::hasAnySparse
bool hasAnySparse(const BitVector &bits) const
Returns true if any TensorLoopId in the bitvector corresponds to sparse level-type.
Definition: Merger.cpp:671

mlir::sparse_tensor::Merger::addLat
LatPointId addLat(TensorId t, LoopId i, ExprId e)
Constructs a new iteration lattice point, and returns its identifier.
Definition: Merger.cpp:293

mlir::sparse_tensor::Merger::addLoopVarExp
ExprId addLoopVarExp(LoopId i)
Constructs a new loop-variable expression, and returns its identifier.
Definition: Merger.cpp:255

mlir::sparse_tensor::Merger::latGT
bool latGT(LatPointId p0, LatPointId p1) const
Returns true if p0 > p1.
Definition: Merger.cpp:503

mlir::sparse_tensor::Merger::exp
const TensorExp & exp(ExprId e) const
Convenience getters to immediately access the stored nodes.
Definition: Merger.h:541

mlir::sparse_tensor::Merger::loop
constexpr LoopId loop(TensorLoopId b) const
Gets the loop-identifier of the TensorLoopId.
Definition: Merger.h:348

mlir::sparse_tensor::Merger::lat
const LatPoint & lat(LatPointId p) const
Definition: Merger.h:545

mlir::sparse_tensor::Merger::onlyDenseDiff
bool onlyDenseDiff(LatPointId p0, LatPointId p1) const
Returns true if p0 and p1 only differ in dense.
Definition: Merger.cpp:516

mlir::sparse_tensor::Merger::addInvariantExp
ExprId addInvariantExp(Value v)
Constructs a new invariant expression, and returns its identifier.
Definition: Merger.cpp:263

mlir::sparse_tensor::Merger::makeTensorId
constexpr TensorId makeTensorId(unsigned t) const
Safely converts the argument to a tensor identifier.
Definition: Merger.h:243

mlir::sparse_tensor::Merger::getLvlType
LevelType getLvlType(TensorId t, LoopId i) const
Gets the level-type of the tth tensor on ith loop.
Definition: Merger.h:399

mlir::sparse_tensor::Merger::buildExp
Value buildExp(RewriterBase &rewriter, Location loc, ExprId e, Value v0, Value v1) const
Rebuilds SSA format from a tensor expression.
Definition: Merger.cpp:1618

mlir::sparse_tensor::Merger::makeTensorLoopId
constexpr TensorLoopId makeTensorLoopId(unsigned t, unsigned i) const
Safely converts the arguments to a pair of (tensor,loop) identifiers.
Definition: Merger.h:255

mlir::sparse_tensor::Merger::expIsTensor
bool expIsTensor(ExprId e, TensorId t) const
Returns true if the expression is (kTensor t).
Definition: Merger.h:370

Arith.h

Math.h

SparseTensor.h

mlir::remark::add
detail::LazyTextBuild add(const char *fmt, Ts &&...ts)
Create a Remark with llvm::formatv formatting.
Definition: Remarks.h:533

mlir::sparse_tensor::detail::kInvalidId
static constexpr unsigned kInvalidId
A constant serving as the canonically invalid identifier, regardless of the identifier type.
Definition: Merger.h:30

mlir::sparse_tensor::LevelFormat
LevelFormat
This enum defines all supported storage format without the level properties.
Definition: Enums.h:154

mlir::sparse_tensor::LevelFormat::Undef
@ Undef

mlir::sparse_tensor::isCertainZero
static bool isCertainZero(Value val)
Only returns true if we are certain this is a zero.
Definition: Merger.cpp:1201

mlir::sparse_tensor::isAdmissibleBranchExp
static bool isAdmissibleBranchExp(Operation *op, Block *block, Value v)
Ensures that the sparsifier can generate code for expression.
Definition: Merger.cpp:1244

mlir::sparse_tensor::LatSetId
unsigned LatSetId
LatSet identifiers.
Definition: Merger.h:57

mlir::sparse_tensor::insertYieldOp
static Value insertYieldOp(RewriterBase &rewriter, Location loc, Region &region, ValueRange vals)
Definition: Merger.cpp:1557

mlir::sparse_tensor::toMLIRString
std::string toMLIRString(LevelType lt)
Definition: Enums.h:447

mlir::sparse_tensor::LvlLTPair
std::pair< Level, LevelType > LvlLTPair
A pair of level and its corresponding LevelType of a tensor.
Definition: Merger.h:60

mlir::sparse_tensor::TensorLoopId
unsigned TensorLoopId
A compressed representation of std::pair<TensorId, LoopId>.
Definition: Merger.h:44

mlir::sparse_tensor::buildUnaryPresent
static Value buildUnaryPresent(RewriterBase &rewriter, Location loc, Operation *op, Value v0)
Definition: Merger.cpp:1574

mlir::sparse_tensor::Level
uint64_t Level
The type of level identifiers and level-ranks.
Definition: SparseTensor.h:42

mlir::sparse_tensor::buildBinaryOverlap
static Value buildBinaryOverlap(RewriterBase &rewriter, Location loc, Operation *op, Value v0, Value v1)
Definition: Merger.cpp:1588

mlir::sparse_tensor::isAdmissibleBranch
static bool isAdmissibleBranch(Operation *op, Region &region)
Ensures that the sparsifier can generate code for branch.
Definition: Merger.cpp:1264

mlir::sparse_tensor::LoopId
unsigned LoopId
Loop identifiers.
Definition: Merger.h:38

mlir::sparse_tensor::kindToOpSymbol
static const char * kindToOpSymbol(TensorExp::Kind kind)
Definition: Merger.cpp:693

mlir::sparse_tensor::getSparseTensorEncoding
SparseTensorEncodingAttr getSparseTensorEncoding(Type type)
Convenience method to get a sparse encoding attribute from a type.
Definition: SparseTensorDialect.cpp:1033

mlir::sparse_tensor::isGreater
static bool isGreater(TensorExp::Kind kind, Attribute attr)
Definition: Merger.cpp:1274

mlir::sparse_tensor::ExpArity
ExpArity
Definition: Merger.cpp:22

mlir::sparse_tensor::ExpArity::kNullary
@ kNullary

mlir::sparse_tensor::ExpArity::kBinary
@ kBinary

mlir::sparse_tensor::ExpArity::kUnary
@ kUnary

mlir::sparse_tensor::ExprId
unsigned ExprId
TensorExp identifiers.
Definition: Merger.h:48

mlir::sparse_tensor::getExpArity
static ExpArity getExpArity(TensorExp::Kind k)
Definition: Merger.cpp:28

mlir::sparse_tensor::buildRelu
static Value buildRelu(RewriterBase &rewriter, Location loc, Value v0, Attribute attr)
Definition: Merger.cpp:1602

mlir::sparse_tensor::LatPointId
unsigned LatPointId
LatPoint identifiers.
Definition: Merger.h:52

mlir::sparse_tensor::LoopCoeffPair
std::pair< LoopId, unsigned > LoopCoeffPair
A pair of loop id and its coefficients.
Definition: Merger.h:64

mlir::sparse_tensor::TensorId
unsigned TensorId
Tensor identifiers, chosen to be the BlockArgument::getArgNumber of the value passed to Merger::build...
Definition: Merger.h:35

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:509

mlir::sparse_tensor::LatPoint::bits
BitVector bits
Conjunction of all TensorLoopIds involved in the tensor expression.
Definition: Merger.h:210

mlir::sparse_tensor::LevelType
This enum defines all the sparse representations supportable by the SparseTensor dialect.
Definition: Enums.h:238

mlir::sparse_tensor::TensorExp::Children::e1
ExprId e1
Definition: Merger.h:73

mlir::sparse_tensor::TensorExp::Children::e0
ExprId e0
Definition: Merger.h:72

mlir::sparse_tensor::TensorExp::loop
LoopId loop
kLoopVar expressions simply have a loop identifier.
Definition: Merger.h:96

mlir::sparse_tensor::TensorExp::val
Value val
Direct link to IR for an invariant or the destination value (to infer destination type) of a cast ope...
Definition: Merger.h:105

mlir::sparse_tensor::TensorExp::Kind
Kind
Tensor expression kind.
Definition: Merger.h:129

mlir::sparse_tensor::TensorExp::Kind::kDivU
@ kDivU

mlir::sparse_tensor::TensorExp::Kind::kAbsF
@ kAbsF

mlir::sparse_tensor::TensorExp::Kind::kCastFU
@ kCastFU

mlir::sparse_tensor::TensorExp::Kind::kRelu
@ kRelu

mlir::sparse_tensor::TensorExp::Kind::kTanhC
@ kTanhC

mlir::sparse_tensor::TensorExp::Kind::kSelect
@ kSelect

mlir::sparse_tensor::TensorExp::Kind::kCeilF
@ kCeilF

mlir::sparse_tensor::TensorExp::Kind::kDenseOp
@ kDenseOp

mlir::sparse_tensor::TensorExp::Kind::kCastU
@ kCastU

mlir::sparse_tensor::TensorExp::Kind::kCastFS
@ kCastFS

mlir::sparse_tensor::TensorExp::Kind::kCRe
@ kCRe

mlir::sparse_tensor::TensorExp::Kind::kBinary
@ kBinary

mlir::sparse_tensor::TensorExp::Kind::kSynZero
@ kSynZero

mlir::sparse_tensor::TensorExp::Kind::kShlI
@ kShlI

mlir::sparse_tensor::TensorExp::Kind::kXorI
@ kXorI

mlir::sparse_tensor::TensorExp::Kind::kMulI
@ kMulI

mlir::sparse_tensor::TensorExp::Kind::kDivS
@ kDivS

mlir::sparse_tensor::TensorExp::Kind::kSinF
@ kSinF

mlir::sparse_tensor::TensorExp::Kind::kAddC
@ kAddC

mlir::sparse_tensor::TensorExp::Kind::kBitCast
@ kBitCast

mlir::sparse_tensor::TensorExp::Kind::kAbsI
@ kAbsI

mlir::sparse_tensor::TensorExp::Kind::kMulC
@ kMulC

mlir::sparse_tensor::TensorExp::Kind::kCmpI
@ kCmpI

mlir::sparse_tensor::TensorExp::Kind::kCmpF
@ kCmpF

mlir::sparse_tensor::TensorExp::Kind::kSinC
@ kSinC

mlir::sparse_tensor::TensorExp::Kind::kShrS
@ kShrS

mlir::sparse_tensor::TensorExp::Kind::kSubF
@ kSubF

mlir::sparse_tensor::TensorExp::Kind::kTruncI
@ kTruncI

mlir::sparse_tensor::TensorExp::Kind::kNegF
@ kNegF

mlir::sparse_tensor::TensorExp::Kind::kCastS
@ kCastS

mlir::sparse_tensor::TensorExp::Kind::kSubI
@ kSubI

mlir::sparse_tensor::TensorExp::Kind::kTensor
@ kTensor

mlir::sparse_tensor::TensorExp::Kind::kReduce
@ kReduce

mlir::sparse_tensor::TensorExp::Kind::kCIm
@ kCIm

mlir::sparse_tensor::TensorExp::Kind::kUnary
@ kUnary

mlir::sparse_tensor::TensorExp::Kind::kDivF
@ kDivF

mlir::sparse_tensor::TensorExp::Kind::kAndI
@ kAndI

mlir::sparse_tensor::TensorExp::Kind::kExtF
@ kExtF

mlir::sparse_tensor::TensorExp::Kind::kSubC
@ kSubC

mlir::sparse_tensor::TensorExp::Kind::kShrU
@ kShrU

mlir::sparse_tensor::TensorExp::Kind::kSqrtF
@ kSqrtF

mlir::sparse_tensor::TensorExp::Kind::kLog1pF
@ kLog1pF

mlir::sparse_tensor::TensorExp::Kind::kTruncF
@ kTruncF

mlir::sparse_tensor::TensorExp::Kind::kCastUF
@ kCastUF

mlir::sparse_tensor::TensorExp::Kind::kFloorF
@ kFloorF

mlir::sparse_tensor::TensorExp::Kind::kLoopVar
@ kLoopVar

mlir::sparse_tensor::TensorExp::Kind::kInvariant
@ kInvariant

mlir::sparse_tensor::TensorExp::Kind::kExpm1C
@ kExpm1C

mlir::sparse_tensor::TensorExp::Kind::kCastSF
@ kCastSF

mlir::sparse_tensor::TensorExp::Kind::kDivC
@ kDivC

mlir::sparse_tensor::TensorExp::Kind::kCastIdx
@ kCastIdx

mlir::sparse_tensor::TensorExp::Kind::kBinaryBranch
@ kBinaryBranch

mlir::sparse_tensor::TensorExp::Kind::kAddF
@ kAddF

mlir::sparse_tensor::TensorExp::Kind::kMulF
@ kMulF

mlir::sparse_tensor::TensorExp::Kind::kSqrtC
@ kSqrtC

mlir::sparse_tensor::TensorExp::Kind::kAbsC
@ kAbsC

mlir::sparse_tensor::TensorExp::Kind::kTanhF
@ kTanhF

mlir::sparse_tensor::TensorExp::Kind::kExpm1F
@ kExpm1F

mlir::sparse_tensor::TensorExp::Kind::kOrI
@ kOrI

mlir::sparse_tensor::TensorExp::Kind::kNegI
@ kNegI

mlir::sparse_tensor::TensorExp::Kind::kAddI
@ kAddI

mlir::sparse_tensor::TensorExp::Kind::kNegC
@ kNegC

mlir::sparse_tensor::TensorExp::Kind::kLog1pC
@ kLog1pC

mlir::sparse_tensor::TensorExp::children
Children children
All other expressions hold the ExprIds of their children.
Definition: Merger.h:99

mlir::sparse_tensor::TensorExp::attr
Attribute attr
An optional attribute that is required to determine the semantics of the operations.
Definition: Merger.h:118

mlir::sparse_tensor::TensorExp::tensor
TensorId tensor
kTensor expressions simply have a tensor identifier.
Definition: Merger.h:93

mlir::sparse_tensor::TensorExp::kind
Kind kind
Tensor expression kind.
Definition: Merger.h:89

mlir::sparse_tensor::TensorExp::TensorExp
TensorExp(Kind k, unsigned x, ExprId y, Value v, Operation *op, Attribute a)
The x parameter has different types depending on the value of the k parameter.
Definition: Merger.cpp:106

j
Eliminates variable at the specified position using Fourier-Motzkin variable elimination.