doxygen/Dialect_2Affine_2Utils_2Utils_8cpp_source.html

 //===- Utils.cpp ---- Utilities for affine dialect transformation ---------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This file implements miscellaneous transformation utilities for the Affine

 // dialect.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/Affine/Utils.h"


 #include "mlir/Dialect/Affine/Analysis/Utils.h"

 #include "mlir/Dialect/Affine/IR/AffineOps.h"

 #include "mlir/Dialect/Affine/IR/AffineValueMap.h"

 #include "mlir/Dialect/Affine/LoopUtils.h"

 #include "mlir/Dialect/Arith/Utils/Utils.h"

 #include "mlir/Dialect/Func/IR/FuncOps.h"

 #include "mlir/Dialect/MemRef/IR/MemRef.h"

 #include "mlir/Dialect/Utils/IndexingUtils.h"

 #include "mlir/IR/AffineExprVisitor.h"

 #include "mlir/IR/Dominance.h"

 #include "mlir/IR/IRMapping.h"

 #include "mlir/IR/IntegerSet.h"

 #include "mlir/Transforms/GreedyPatternRewriteDriver.h"

 #include <optional>


 #define DEBUG_TYPE "affine-utils"


 using namespace mlir;

 using namespace affine;

 using namespace presburger;


 namespace {

 /// Visit affine expressions recursively and build the sequence of operations

 /// that correspond to it.  Visitation functions return an Value of the

 /// expression subtree they visited or `nullptr` on error.

 class AffineApplyExpander

     : public AffineExprVisitor<AffineApplyExpander, Value> {

 public:

   /// This internal class expects arguments to be non-null, checks must be

   /// performed at the call site.

   AffineApplyExpander(OpBuilder &builder, ValueRange dimValues,

                       ValueRange symbolValues, Location loc)

       : builder(builder), dimValues(dimValues), symbolValues(symbolValues),

         loc(loc) {}


   template <typename OpTy>

   Value buildBinaryExpr(AffineBinaryOpExpr expr,

                         arith::IntegerOverflowFlags overflowFlags =

                             arith::IntegerOverflowFlags::none) {

     auto lhs = visit(expr.getLHS());

     auto rhs = visit(expr.getRHS());

     if (!lhs || !rhs)

       return nullptr;

     auto op = OpTy::create(builder, loc, lhs, rhs, overflowFlags);

     return op.getResult();

   }


   Value visitAddExpr(AffineBinaryOpExpr expr) {

     return buildBinaryExpr<arith::AddIOp>(expr);

   }


   Value visitMulExpr(AffineBinaryOpExpr expr) {

     return buildBinaryExpr<arith::MulIOp>(expr,

                                           arith::IntegerOverflowFlags::nsw);

   }


   /// Euclidean modulo operation: negative RHS is not allowed.

   /// Remainder of the euclidean integer division is always non-negative.

   ///

   /// Implemented as

   ///

   ///     a mod b =

   ///         let remainder = srem a, b;

   ///             negative = a < 0 in

   ///         select negative, remainder + b, remainder.

   Value visitModExpr(AffineBinaryOpExpr expr) {

     if (auto rhsConst = dyn_cast<AffineConstantExpr>(expr.getRHS())) {

       if (rhsConst.getValue() <= 0) {

         emitError(loc, "modulo by non-positive value is not supported");

         return nullptr;

       }

     }


     auto lhs = visit(expr.getLHS());

     auto rhs = visit(expr.getRHS());

     assert(lhs && rhs && "unexpected affine expr lowering failure");


     Value remainder = arith::RemSIOp::create(builder, loc, lhs, rhs);

     Value zeroCst = arith::ConstantIndexOp::create(builder, loc, 0);

     Value isRemainderNegative = arith::CmpIOp::create(

         builder, loc, arith::CmpIPredicate::slt, remainder, zeroCst);

     Value correctedRemainder =

         arith::AddIOp::create(builder, loc, remainder, rhs);

     Value result = arith::SelectOp::create(builder, loc, isRemainderNegative,

                                            correctedRemainder, remainder);

     return result;

   }


   /// Floor division operation (rounds towards negative infinity).

   ///

   /// For positive divisors, it can be implemented without branching and with a

   /// single division operation as

   ///

   ///        a floordiv b =

   ///            let negative = a < 0 in

   ///            let absolute = negative ? -a - 1 : a in

   ///            let quotient = absolute / b in

   ///                negative ? -quotient - 1 : quotient

   ///

   /// Note: this lowering does not use arith.floordivsi because the lowering of

   /// that to arith.divsi (see populateCeilFloorDivExpandOpsPatterns) generates

   /// not one but two arith.divsi. That could be changed to one divsi, but one

   /// way or another, going through arith.floordivsi will result in more complex

   /// IR because arith.floordivsi is more general than affine floordiv in that

   /// it supports negative RHS.

   Value visitFloorDivExpr(AffineBinaryOpExpr expr) {

     if (auto rhsConst = dyn_cast<AffineConstantExpr>(expr.getRHS())) {

       if (rhsConst.getValue() <= 0) {

         emitError(loc, "division by non-positive value is not supported");

         return nullptr;

       }

     }

     auto lhs = visit(expr.getLHS());

     auto rhs = visit(expr.getRHS());

     assert(lhs && rhs && "unexpected affine expr lowering failure");


     Value zeroCst = arith::ConstantIndexOp::create(builder, loc, 0);

     Value noneCst = arith::ConstantIndexOp::create(builder, loc, -1);

     Value negative = arith::CmpIOp::create(

         builder, loc, arith::CmpIPredicate::slt, lhs, zeroCst);

     Value negatedDecremented =

         arith::SubIOp::create(builder, loc, noneCst, lhs);

     Value dividend = arith::SelectOp::create(builder, loc, negative,

                                              negatedDecremented, lhs);

     Value quotient = arith::DivSIOp::create(builder, loc, dividend, rhs);

     Value correctedQuotient =

         arith::SubIOp::create(builder, loc, noneCst, quotient);

     Value result = arith::SelectOp::create(builder, loc, negative,

                                            correctedQuotient, quotient);

     return result;

   }


   /// Ceiling division operation (rounds towards positive infinity).

   ///

   /// For positive divisors, it can be implemented without branching and with a

   /// single division operation as

   ///

   ///     a ceildiv b =

   ///         let negative = a <= 0 in

   ///         let absolute = negative ? -a : a - 1 in

   ///         let quotient = absolute / b in

   ///             negative ? -quotient : quotient + 1

   ///

   /// Note: not using arith.ceildivsi for the same reason as explained in the

   /// visitFloorDivExpr comment.

   Value visitCeilDivExpr(AffineBinaryOpExpr expr) {

     if (auto rhsConst = dyn_cast<AffineConstantExpr>(expr.getRHS())) {

       if (rhsConst.getValue() <= 0) {

         emitError(loc, "division by non-positive value is not supported");

         return nullptr;

       }

     }

     auto lhs = visit(expr.getLHS());

     auto rhs = visit(expr.getRHS());

     assert(lhs && rhs && "unexpected affine expr lowering failure");


     Value zeroCst = arith::ConstantIndexOp::create(builder, loc, 0);

     Value oneCst = arith::ConstantIndexOp::create(builder, loc, 1);

     Value nonPositive = arith::CmpIOp::create(

         builder, loc, arith::CmpIPredicate::sle, lhs, zeroCst);

     Value negated = arith::SubIOp::create(builder, loc, zeroCst, lhs);

     Value decremented = arith::SubIOp::create(builder, loc, lhs, oneCst);

     Value dividend = arith::SelectOp::create(builder, loc, nonPositive, negated,

                                              decremented);

     Value quotient = arith::DivSIOp::create(builder, loc, dividend, rhs);

     Value negatedQuotient =

         arith::SubIOp::create(builder, loc, zeroCst, quotient);

     Value incrementedQuotient =

         arith::AddIOp::create(builder, loc, quotient, oneCst);

     Value result = arith::SelectOp::create(

         builder, loc, nonPositive, negatedQuotient, incrementedQuotient);

     return result;

   }


   Value visitConstantExpr(AffineConstantExpr expr) {

     auto op = arith::ConstantIndexOp::create(builder, loc, expr.getValue());

     return op.getResult();

   }


   Value visitDimExpr(AffineDimExpr expr) {

     assert(expr.getPosition() < dimValues.size() &&

            "affine dim position out of range");

     return dimValues[expr.getPosition()];

   }


   Value visitSymbolExpr(AffineSymbolExpr expr) {

     assert(expr.getPosition() < symbolValues.size() &&

            "symbol dim position out of range");

     return symbolValues[expr.getPosition()];

   }


 private:

   OpBuilder &builder;

   ValueRange dimValues;

   ValueRange symbolValues;


   Location loc;

 };

 } // namespace


 /// Create a sequence of operations that implement the `expr` applied to the

 /// given dimension and symbol values.

 mlir::Value mlir::affine::expandAffineExpr(OpBuilder &builder, Location loc,

                                            AffineExpr expr,

                                            ValueRange dimValues,

                                            ValueRange symbolValues) {

   return AffineApplyExpander(builder, dimValues, symbolValues, loc).visit(expr);

 }


 /// Create a sequence of operations that implement the `affineMap` applied to

 /// the given `operands` (as it it were an AffineApplyOp).

 std::optional<SmallVector<Value, 8>>

 mlir::affine::expandAffineMap(OpBuilder &builder, Location loc,

                               AffineMap affineMap, ValueRange operands) {

   auto numDims = affineMap.getNumDims();

   auto expanded = llvm::to_vector<8>(

       llvm::map_range(affineMap.getResults(),

                       [numDims, &builder, loc, operands](AffineExpr expr) {

                         return expandAffineExpr(builder, loc, expr,

                                                 operands.take_front(numDims),

                                                 operands.drop_front(numDims));

                       }));

   if (llvm::all_of(expanded, [](Value v) { return v; }))

     return expanded;

   return std::nullopt;

 }


 /// Promotes the `then` or the `else` block of `ifOp` (depending on whether

 /// `elseBlock` is false or true) into `ifOp`'s containing block, and discards

 /// the rest of the op.

 static void promoteIfBlock(AffineIfOp ifOp, bool elseBlock) {

   if (elseBlock)

     assert(ifOp.hasElse() && "else block expected");


   Block *destBlock = ifOp->getBlock();

   Block *srcBlock = elseBlock ? ifOp.getElseBlock() : ifOp.getThenBlock();

   destBlock->getOperations().splice(

       Block::iterator(ifOp), srcBlock->getOperations(), srcBlock->begin(),

       std::prev(srcBlock->end()));

   ifOp.erase();

 }


 /// Returns the outermost affine.for/parallel op that the `ifOp` is invariant

 /// on. The `ifOp` could be hoisted and placed right before such an operation.

 /// This method assumes that the ifOp has been canonicalized (to be correct and

 /// effective).

 static Operation *getOutermostInvariantForOp(AffineIfOp ifOp) {

   // Walk up the parents past all for op that this conditional is invariant on.

   auto ifOperands = ifOp.getOperands();

   Operation *res = ifOp;

   while (!res->getParentOp()->hasTrait<OpTrait::IsIsolatedFromAbove>()) {

     auto *parentOp = res->getParentOp();

     if (auto forOp = dyn_cast<AffineForOp>(parentOp)) {

       if (llvm::is_contained(ifOperands, forOp.getInductionVar()))

         break;

     } else if (auto parallelOp = dyn_cast<AffineParallelOp>(parentOp)) {

       if (llvm::any_of(parallelOp.getIVs(), [&](Value iv) {

             return llvm::is_contained(ifOperands, iv);

           }))

         break;

     } else if (!isa<AffineIfOp>(parentOp)) {

       // Won't walk up past anything other than affine.for/if ops.

       break;

     }

     // You can always hoist up past any affine.if ops.

     res = parentOp;

   }

   return res;

 }


 /// A helper for the mechanics of mlir::hoistAffineIfOp. Hoists `ifOp` just over

 /// `hoistOverOp`. Returns the new hoisted op if any hoisting happened,

 /// otherwise the same `ifOp`.

 static AffineIfOp hoistAffineIfOp(AffineIfOp ifOp, Operation *hoistOverOp) {

   // No hoisting to do.

   if (hoistOverOp == ifOp)

     return ifOp;


   // Create the hoisted 'if' first. Then, clone the op we are hoisting over for

   // the else block. Then drop the else block of the original 'if' in the 'then'

   // branch while promoting its then block, and analogously drop the 'then'

   // block of the original 'if' from the 'else' branch while promoting its else

   // block.

   IRMapping operandMap;

   OpBuilder b(hoistOverOp);

   auto hoistedIfOp = AffineIfOp::create(b, ifOp.getLoc(), ifOp.getIntegerSet(),

                                         ifOp.getOperands(),

                                         /*elseBlock=*/true);


   // Create a clone of hoistOverOp to use for the else branch of the hoisted

   // conditional. The else block may get optimized away if empty.

   Operation *hoistOverOpClone = nullptr;

   // We use this unique name to identify/find  `ifOp`'s clone in the else

   // version.

   StringAttr idForIfOp = b.getStringAttr("__mlir_if_hoisting");

   operandMap.clear();

   b.setInsertionPointAfter(hoistOverOp);

   // We'll set an attribute to identify this op in a clone of this sub-tree.

   ifOp->setAttr(idForIfOp, b.getBoolAttr(true));

   hoistOverOpClone = b.clone(*hoistOverOp, operandMap);


   // Promote the 'then' block of the original affine.if in the then version.

   promoteIfBlock(ifOp, /*elseBlock=*/false);


   // Move the then version to the hoisted if op's 'then' block.

   auto *thenBlock = hoistedIfOp.getThenBlock();

   thenBlock->getOperations().splice(thenBlock->begin(),

                                     hoistOverOp->getBlock()->getOperations(),

                                     Block::iterator(hoistOverOp));


   // Find the clone of the original affine.if op in the else version.

   AffineIfOp ifCloneInElse;

   hoistOverOpClone->walk([&](AffineIfOp ifClone) {

     if (!ifClone->getAttr(idForIfOp))

       return WalkResult::advance();

     ifCloneInElse = ifClone;

     return WalkResult::interrupt();

   });

   assert(ifCloneInElse && "if op clone should exist");

   // For the else block, promote the else block of the original 'if' if it had

   // one; otherwise, the op itself is to be erased.

   if (!ifCloneInElse.hasElse())

     ifCloneInElse.erase();

   else

     promoteIfBlock(ifCloneInElse, /*elseBlock=*/true);


   // Move the else version into the else block of the hoisted if op.

   auto *elseBlock = hoistedIfOp.getElseBlock();

   elseBlock->getOperations().splice(

       elseBlock->begin(), hoistOverOpClone->getBlock()->getOperations(),

       Block::iterator(hoistOverOpClone));


   return hoistedIfOp;

 }


 LogicalResult

 mlir::affine::affineParallelize(AffineForOp forOp,

                                 ArrayRef<LoopReduction> parallelReductions,

                                 AffineParallelOp *resOp) {

   // Fail early if there are iter arguments that are not reductions.

   unsigned numReductions = parallelReductions.size();

   if (numReductions != forOp.getNumIterOperands())

     return failure();


   Location loc = forOp.getLoc();

   OpBuilder outsideBuilder(forOp);

   AffineMap lowerBoundMap = forOp.getLowerBoundMap();

   ValueRange lowerBoundOperands = forOp.getLowerBoundOperands();

   AffineMap upperBoundMap = forOp.getUpperBoundMap();

   ValueRange upperBoundOperands = forOp.getUpperBoundOperands();


   // Creating empty 1-D affine.parallel op.

   auto reducedValues = llvm::to_vector<4>(llvm::map_range(

       parallelReductions, [](const LoopReduction &red) { return red.value; }));

   auto reductionKinds = llvm::to_vector<4>(llvm::map_range(

       parallelReductions, [](const LoopReduction &red) { return red.kind; }));

   AffineParallelOp newPloop = AffineParallelOp::create(

       outsideBuilder, loc, ValueRange(reducedValues).getTypes(), reductionKinds,

       llvm::ArrayRef(lowerBoundMap), lowerBoundOperands,

       llvm::ArrayRef(upperBoundMap), upperBoundOperands,

       llvm::ArrayRef(forOp.getStepAsInt()));

   // Steal the body of the old affine for op.

   newPloop.getRegion().takeBody(forOp.getRegion());

   Operation *yieldOp = &newPloop.getBody()->back();


   // Handle the initial values of reductions because the parallel loop always

   // starts from the neutral value.

   SmallVector<Value> newResults;

   newResults.reserve(numReductions);

   for (unsigned i = 0; i < numReductions; ++i) {

     Value init = forOp.getInits()[i];

     // This works because we are only handling single-op reductions at the

     // moment. A switch on reduction kind or a mechanism to collect operations

     // participating in the reduction will be necessary for multi-op reductions.

     Operation *reductionOp = yieldOp->getOperand(i).getDefiningOp();

     assert(reductionOp && "yielded value is expected to be produced by an op");

     outsideBuilder.getInsertionBlock()->getOperations().splice(

         outsideBuilder.getInsertionPoint(), newPloop.getBody()->getOperations(),

         reductionOp);

     reductionOp->setOperands({init, newPloop->getResult(i)});

     forOp->getResult(i).replaceAllUsesWith(reductionOp->getResult(0));

   }


   // Update the loop terminator to yield reduced values bypassing the reduction

   // operation itself (now moved outside of the loop) and erase the block

   // arguments that correspond to reductions. Note that the loop always has one

   // "main" induction variable whenc coming from a non-parallel for.

   unsigned numIVs = 1;

   yieldOp->setOperands(reducedValues);

   newPloop.getBody()->eraseArguments(numIVs, numReductions);


   forOp.erase();

   if (resOp)

     *resOp = newPloop;

   return success();

 }


 // Returns success if any hoisting happened.

 LogicalResult mlir::affine::hoistAffineIfOp(AffineIfOp ifOp, bool *folded) {

   // Bail out early if the ifOp returns a result.  TODO: Consider how to

   // properly support this case.

   if (ifOp.getNumResults() != 0)

     return failure();


   // Apply canonicalization patterns and folding - this is necessary for the

   // hoisting check to be correct (operands should be composed), and to be more

   // effective (no unused operands). Since the pattern rewriter's folding is

   // entangled with application of patterns, we may fold/end up erasing the op,

   // in which case we return with `folded` being set.

   RewritePatternSet patterns(ifOp.getContext());

   AffineIfOp::getCanonicalizationPatterns(patterns, ifOp.getContext());

   FrozenRewritePatternSet frozenPatterns(std::move(patterns));

   bool erased;

   (void)applyOpPatternsGreedily(

       ifOp.getOperation(), frozenPatterns,

       GreedyRewriteConfig().setStrictness(GreedyRewriteStrictness::ExistingOps),

       /*changed=*/nullptr, &erased);

   if (erased) {

     if (folded)

       *folded = true;

     return failure();

   }

   if (folded)

     *folded = false;


   // The folding above should have ensured this.

   assert(llvm::all_of(ifOp.getOperands(),

                       [](Value v) {

                         return isTopLevelValue(v) || isAffineInductionVar(v);

                       }) &&

          "operands not composed");


   // We are going hoist as high as possible.

   // TODO: this could be customized in the future.

   auto *hoistOverOp = getOutermostInvariantForOp(ifOp);


   AffineIfOp hoistedIfOp = ::hoistAffineIfOp(ifOp, hoistOverOp);

   // Nothing to hoist over.

   if (hoistedIfOp == ifOp)

     return failure();


   // Canonicalize to remove dead else blocks (happens whenever an 'if' moves up

   // a sequence of affine.fors that are all perfectly nested).

   (void)applyPatternsGreedily(

       hoistedIfOp->getParentWithTrait<OpTrait::IsIsolatedFromAbove>(),

       frozenPatterns);


   return success();

 }


 // Return the min expr after replacing the given dim.

 AffineExpr mlir::affine::substWithMin(AffineExpr e, AffineExpr dim,

                                       AffineExpr min, AffineExpr max,

                                       bool positivePath) {

   if (e == dim)

     return positivePath ? min : max;

   if (auto bin = dyn_cast<AffineBinaryOpExpr>(e)) {

     AffineExpr lhs = bin.getLHS();

     AffineExpr rhs = bin.getRHS();

     if (bin.getKind() == mlir::AffineExprKind::Add)

       return substWithMin(lhs, dim, min, max, positivePath) +

              substWithMin(rhs, dim, min, max, positivePath);


     auto c1 = dyn_cast<AffineConstantExpr>(bin.getLHS());

     auto c2 = dyn_cast<AffineConstantExpr>(bin.getRHS());

     if (c1 && c1.getValue() < 0)

       return getAffineBinaryOpExpr(

           bin.getKind(), c1, substWithMin(rhs, dim, min, max, !positivePath));

     if (c2 && c2.getValue() < 0)

       return getAffineBinaryOpExpr(

           bin.getKind(), substWithMin(lhs, dim, min, max, !positivePath), c2);

     return getAffineBinaryOpExpr(

         bin.getKind(), substWithMin(lhs, dim, min, max, positivePath),

         substWithMin(rhs, dim, min, max, positivePath));

   }

   return e;

 }


 void mlir::affine::normalizeAffineParallel(AffineParallelOp op) {

   // Loops with min/max in bounds are not normalized at the moment.

   if (op.hasMinMaxBounds())

     return;


   AffineMap lbMap = op.getLowerBoundsMap();

   SmallVector<int64_t, 8> steps = op.getSteps();

   // No need to do any work if the parallel op is already normalized.

   bool isAlreadyNormalized =

       llvm::all_of(llvm::zip(steps, lbMap.getResults()), [](auto tuple) {

         int64_t step = std::get<0>(tuple);

         auto lbExpr = dyn_cast<AffineConstantExpr>(std::get<1>(tuple));

         return lbExpr && lbExpr.getValue() == 0 && step == 1;

       });

   if (isAlreadyNormalized)

     return;


   AffineValueMap ranges;

   AffineValueMap::difference(op.getUpperBoundsValueMap(),

                              op.getLowerBoundsValueMap(), &ranges);

   auto builder = OpBuilder::atBlockBegin(op.getBody());

   auto zeroExpr = builder.getAffineConstantExpr(0);

   SmallVector<AffineExpr, 8> lbExprs;

   SmallVector<AffineExpr, 8> ubExprs;

   for (unsigned i = 0, e = steps.size(); i < e; ++i) {

     int64_t step = steps[i];


     // Adjust the lower bound to be 0.

     lbExprs.push_back(zeroExpr);


     // Adjust the upper bound expression: 'range / step'.

     AffineExpr ubExpr = ranges.getResult(i).ceilDiv(step);

     ubExprs.push_back(ubExpr);


     // Adjust the corresponding IV: 'lb + i * step'.

     BlockArgument iv = op.getBody()->getArgument(i);

     AffineExpr lbExpr = lbMap.getResult(i);

     unsigned nDims = lbMap.getNumDims();

     auto expr = lbExpr + builder.getAffineDimExpr(nDims) * step;

     auto map = AffineMap::get(/*dimCount=*/nDims + 1,

                               /*symbolCount=*/lbMap.getNumSymbols(), expr);


     // Use an 'affine.apply' op that will be simplified later in subsequent

     // canonicalizations.

     OperandRange lbOperands = op.getLowerBoundsOperands();

     OperandRange dimOperands = lbOperands.take_front(nDims);

     OperandRange symbolOperands = lbOperands.drop_front(nDims);

     SmallVector<Value, 8> applyOperands{dimOperands};

     applyOperands.push_back(iv);

     applyOperands.append(symbolOperands.begin(), symbolOperands.end());

     auto apply =

         AffineApplyOp::create(builder, op.getLoc(), map, applyOperands);

     iv.replaceAllUsesExcept(apply, apply);

   }


   SmallVector<int64_t, 8> newSteps(op.getNumDims(), 1);

   op.setSteps(newSteps);

   auto newLowerMap = AffineMap::get(

       /*dimCount=*/0, /*symbolCount=*/0, lbExprs, op.getContext());

   op.setLowerBounds({}, newLowerMap);

   auto newUpperMap = AffineMap::get(ranges.getNumDims(), ranges.getNumSymbols(),

                                     ubExprs, op.getContext());

   op.setUpperBounds(ranges.getOperands(), newUpperMap);

 }


 LogicalResult mlir::affine::normalizeAffineFor(AffineForOp op,

                                                bool promoteSingleIter) {

   if (promoteSingleIter && succeeded(promoteIfSingleIteration(op)))

     return success();


   // Check if the forop is already normalized.

   if (op.hasConstantLowerBound() && (op.getConstantLowerBound() == 0) &&

       (op.getStep() == 1))

     return success();


   // Check if the lower bound has a single result only. Loops with a max lower

   // bound can't be normalized without additional support like

   // affine.execute_region's. If the lower bound does not have a single result

   // then skip this op.

   if (op.getLowerBoundMap().getNumResults() != 1)

     return failure();


   Location loc = op.getLoc();

   OpBuilder opBuilder(op);

   int64_t origLoopStep = op.getStepAsInt();


   // Construct the new upper bound value map.

   AffineMap oldLbMap = op.getLowerBoundMap();

   // The upper bound can have multiple results. To use

   // AffineValueMap::difference, we need to have the same number of results in

   // both lower and upper bound maps. So, we just create a value map for the

   // lower bound with the only available lower bound result repeated to pad up

   // to the number of upper bound results.

   SmallVector<AffineExpr> lbExprs(op.getUpperBoundMap().getNumResults(),

                                   op.getLowerBoundMap().getResult(0));

   AffineValueMap lbMap(oldLbMap, op.getLowerBoundOperands());

   AffineMap paddedLbMap =

       AffineMap::get(oldLbMap.getNumDims(), oldLbMap.getNumSymbols(), lbExprs,

                      op.getContext());

   AffineValueMap paddedLbValueMap(paddedLbMap, op.getLowerBoundOperands());

   AffineValueMap ubValueMap(op.getUpperBoundMap(), op.getUpperBoundOperands());

   AffineValueMap newUbValueMap;

   // Compute the `upper bound - lower bound`.

   AffineValueMap::difference(ubValueMap, paddedLbValueMap, &newUbValueMap);

   (void)newUbValueMap.canonicalize();


   // Scale down the upper bound value map by the loop step.

   unsigned numResult = newUbValueMap.getNumResults();

   SmallVector<AffineExpr> scaleDownExprs(numResult);

   for (unsigned i = 0; i < numResult; ++i)

     scaleDownExprs[i] = opBuilder.getAffineDimExpr(i).ceilDiv(origLoopStep);

   // `scaleDownMap` is (d0, d1, ..., d_n) -> (d0 / step, d1 / step, ..., d_n /

   // step). Where `n` is the number of results in the upper bound map.

   AffineMap scaleDownMap =

       AffineMap::get(numResult, 0, scaleDownExprs, op.getContext());

   AffineMap newUbMap = scaleDownMap.compose(newUbValueMap.getAffineMap());


   // Set the newly create upper bound map and operands.

   op.setUpperBound(newUbValueMap.getOperands(), newUbMap);

   op.setLowerBound({}, opBuilder.getConstantAffineMap(0));

   op.setStep(1);


   // Calculate the Value of new loopIV. Create affine.apply for the value of

   // the loopIV in normalized loop.

   opBuilder.setInsertionPointToStart(op.getBody());

   // Construct an affine.apply op mapping the new IV to the old IV.

   AffineMap scaleIvMap =

       AffineMap::get(1, 0, -opBuilder.getAffineDimExpr(0) * origLoopStep);

   AffineValueMap scaleIvValueMap(scaleIvMap, ValueRange{op.getInductionVar()});

   AffineValueMap newIvToOldIvMap;

   AffineValueMap::difference(lbMap, scaleIvValueMap, &newIvToOldIvMap);

   (void)newIvToOldIvMap.canonicalize();

   auto newIV =

       AffineApplyOp::create(opBuilder, loc, newIvToOldIvMap.getAffineMap(),

                             newIvToOldIvMap.getOperands());

   op.getInductionVar().replaceAllUsesExcept(newIV->getResult(0), newIV);

   return success();

 }


 /// Returns true if the memory operation of `destAccess` depends on `srcAccess`

 /// inside of the innermost common surrounding affine loop between the two

 /// accesses.

 static bool mustReachAtInnermost(const MemRefAccess &srcAccess,

                                  const MemRefAccess &destAccess) {

   // Affine dependence analysis is possible only if both ops in the same

   // AffineScope.

   if (getAffineAnalysisScope(srcAccess.opInst) !=

       getAffineAnalysisScope(destAccess.opInst))

     return false;


   unsigned nsLoops =

       getNumCommonSurroundingLoops(*srcAccess.opInst, *destAccess.opInst);

   DependenceResult result =

       checkMemrefAccessDependence(srcAccess, destAccess, nsLoops + 1);

   return hasDependence(result);

 }


 /// Returns true if `srcMemOp` may have an effect on `destMemOp` within the

 /// scope of the outermost `minSurroundingLoops` loops that surround them.

 /// `srcMemOp` and `destMemOp` are expected to be affine read/write ops.

 static bool mayHaveEffect(Operation *srcMemOp, Operation *destMemOp,

                           unsigned minSurroundingLoops) {

   MemRefAccess srcAccess(srcMemOp);

   MemRefAccess destAccess(destMemOp);


   // Affine dependence analysis here is applicable only if both ops operate on

   // the same memref and if `srcMemOp` and `destMemOp` are in the same

   // AffineScope. Also, we can only check if our affine scope is isolated from

   // above; otherwise, values can from outside of the affine scope that the

   // check below cannot analyze.

   Region *srcScope = getAffineAnalysisScope(srcMemOp);

   if (srcAccess.memref == destAccess.memref &&

       srcScope == getAffineAnalysisScope(destMemOp)) {

     unsigned nsLoops = getNumCommonSurroundingLoops(*srcMemOp, *destMemOp);

     FlatAffineValueConstraints dependenceConstraints;

     for (unsigned d = nsLoops + 1; d > minSurroundingLoops; d--) {

       DependenceResult result = checkMemrefAccessDependence(

           srcAccess, destAccess, d, &dependenceConstraints,

           /*dependenceComponents=*/nullptr);

       // A dependence failure or the presence of a dependence implies a

       // side effect.

       if (!noDependence(result))

         return true;

     }

     // No side effect was seen.

     return false;

   }

   // TODO: Check here if the memrefs alias: there is no side effect if

   // `srcAccess.memref` and `destAccess.memref` don't alias.

   return true;

 }


 template <typename EffectType, typename T>

 bool mlir::affine::hasNoInterveningEffect(

     Operation *start, T memOp,

     llvm::function_ref<bool(Value, Value)> mayAlias) {

   // A boolean representing whether an intervening operation could have impacted

   // memOp.

   bool hasSideEffect = false;


   // Check whether the effect on memOp can be caused by a given operation op.

   Value memref = memOp.getMemRef();

   std::function<void(Operation *)> checkOperation = [&](Operation *op) {

     // If the effect has alreay been found, early exit,

     if (hasSideEffect)

       return;


     if (auto memEffect = dyn_cast<MemoryEffectOpInterface>(op)) {

       SmallVector<MemoryEffects::EffectInstance, 1> effects;

       memEffect.getEffects(effects);


       bool opMayHaveEffect = false;

       for (auto effect : effects) {

         // If op causes EffectType on a potentially aliasing location for

         // memOp, mark as having the effect.

         if (isa<EffectType>(effect.getEffect())) {

           if (effect.getValue() && effect.getValue() != memref &&

               !mayAlias(effect.getValue(), memref))

             continue;

           opMayHaveEffect = true;

           break;

         }

       }


       if (!opMayHaveEffect)

         return;


       // If the side effect comes from an affine read or write, try to

       // prove the side effecting `op` cannot reach `memOp`.

       if (isa<AffineReadOpInterface, AffineWriteOpInterface>(op)) {

         // For ease, let's consider the case that `op` is a store and

         // we're looking for other potential stores that overwrite memory after

         // `start`, and before being read in `memOp`. In this case, we only

         // need to consider other potential stores with depth >

         // minSurroundingLoops since `start` would overwrite any store with a

         // smaller number of surrounding loops before.

         unsigned minSurroundingLoops =

             getNumCommonSurroundingLoops(*start, *memOp);

         if (mayHaveEffect(op, memOp, minSurroundingLoops))

           hasSideEffect = true;

         return;

       }


       // We have an op with a memory effect and we cannot prove if it

       // intervenes.

       hasSideEffect = true;

       return;

     }


     if (op->hasTrait<OpTrait::HasRecursiveMemoryEffects>()) {

       // Recurse into the regions for this op and check whether the internal

       // operations may have the side effect `EffectType` on memOp.

       for (Region &region : op->getRegions())

         for (Block &block : region)

           for (Operation &op : block)

             checkOperation(&op);

       return;

     }


     // Otherwise, conservatively assume generic operations have the effect

     // on the operation

     hasSideEffect = true;

   };


   // Check all paths from ancestor op `parent` to the operation `to` for the

   // effect. It is known that `to` must be contained within `parent`.

   auto until = [&](Operation *parent, Operation *to) {

     // TODO check only the paths from `parent` to `to`.

     // Currently we fallback and check the entire parent op, rather than

     // just the paths from the parent path, stopping after reaching `to`.

     // This is conservatively correct, but could be made more aggressive.

     assert(parent->isAncestor(to));

     checkOperation(parent);

   };


   // Check for all paths from operation `from` to operation `untilOp` for the

   // given memory effect.

   std::function<void(Operation *, Operation *)> recur =

       [&](Operation *from, Operation *untilOp) {

         assert(

             from->getParentRegion()->isAncestor(untilOp->getParentRegion()) &&

             "Checking for side effect between two operations without a common "

             "ancestor");


         // If the operations are in different regions, recursively consider all

         // path from `from` to the parent of `to` and all paths from the parent

         // of `to` to `to`.

         if (from->getParentRegion() != untilOp->getParentRegion()) {

           recur(from, untilOp->getParentOp());

           until(untilOp->getParentOp(), untilOp);

           return;

         }


         // Now, assuming that `from` and `to` exist in the same region, perform

         // a CFG traversal to check all the relevant operations.


         // Additional blocks to consider.

         SmallVector<Block *, 2> todoBlocks;

         {

           // First consider the parent block of `from` an check all operations

           // after `from`.

           for (auto iter = ++from->getIterator(), end = from->getBlock()->end();

                iter != end && &*iter != untilOp; ++iter) {

             checkOperation(&*iter);

           }


           // If the parent of `from` doesn't contain `to`, add the successors

           // to the list of blocks to check.

           if (untilOp->getBlock() != from->getBlock())

             for (Block *succ : from->getBlock()->getSuccessors())

               todoBlocks.push_back(succ);

         }


         SmallPtrSet<Block *, 4> done;

         // Traverse the CFG until hitting `to`.

         while (!todoBlocks.empty()) {

           Block *blk = todoBlocks.pop_back_val();

           if (done.count(blk))

             continue;

           done.insert(blk);

           for (auto &op : *blk) {

             if (&op == untilOp)

               break;

             checkOperation(&op);

             if (&op == blk->getTerminator())

               for (Block *succ : blk->getSuccessors())

                 todoBlocks.push_back(succ);

           }

         }

       };

   recur(start, memOp);

   return !hasSideEffect;

 }


 /// Attempt to eliminate loadOp by replacing it with a value stored into memory

 /// which the load is guaranteed to retrieve. This check involves three

 /// components: 1) The store and load must be on the same location 2) The store

 /// must dominate (and therefore must always occur prior to) the load 3) No

 /// other operations will overwrite the memory loaded between the given load

 /// and store.  If such a value exists, the replaced `loadOp` will be added to

 /// `loadOpsToErase` and its memref will be added to `memrefsToErase`.

 static void forwardStoreToLoad(

     AffineReadOpInterface loadOp, SmallVectorImpl<Operation *> &loadOpsToErase,

     SmallPtrSetImpl<Value> &memrefsToErase, DominanceInfo &domInfo,

     llvm::function_ref<bool(Value, Value)> mayAlias) {


   // The store op candidate for forwarding that satisfies all conditions

   // to replace the load, if any.

   Operation *lastWriteStoreOp = nullptr;


   for (auto *user : loadOp.getMemRef().getUsers()) {

     auto storeOp = dyn_cast<AffineWriteOpInterface>(user);

     if (!storeOp)

       continue;

     MemRefAccess srcAccess(storeOp);

     MemRefAccess destAccess(loadOp);


     // 1. Check if the store and the load have mathematically equivalent

     // affine access functions; this implies that they statically refer to the

     // same single memref element. As an example this filters out cases like:

     //     store %A[%i0 + 1]

     //     load %A[%i0]

     //     store %A[%M]

     //     load %A[%N]

     // Use the AffineValueMap difference based memref access equality checking.

     if (srcAccess != destAccess)

       continue;


     // 2. The store has to dominate the load op to be candidate.

     if (!domInfo.dominates(storeOp, loadOp))

       continue;


     // 3. The store must reach the load. Access function equivalence only

     // guarantees this for accesses in the same block. The load could be in a

     // nested block that is unreachable.

     if (!mustReachAtInnermost(srcAccess, destAccess))

       continue;


     // 4. Ensure there is no intermediate operation which could replace the

     // value in memory.

     if (!affine::hasNoInterveningEffect<MemoryEffects::Write>(storeOp, loadOp,

                                                               mayAlias))

       continue;


     // We now have a candidate for forwarding.

     assert(lastWriteStoreOp == nullptr &&

            "multiple simultaneous replacement stores");

     lastWriteStoreOp = storeOp;

   }


   if (!lastWriteStoreOp)

     return;


   // Perform the actual store to load forwarding.

   Value storeVal =

       cast<AffineWriteOpInterface>(lastWriteStoreOp).getValueToStore();

   // Check if 2 values have the same shape. This is needed for affine vector

   // loads and stores.

   if (storeVal.getType() != loadOp.getValue().getType())

     return;

   loadOp.getValue().replaceAllUsesWith(storeVal);

   // Record the memref for a later sweep to optimize away.

   memrefsToErase.insert(loadOp.getMemRef());

   // Record this to erase later.

   loadOpsToErase.push_back(loadOp);

 }


 template bool

 mlir::affine::hasNoInterveningEffect<mlir::MemoryEffects::Read,

                                      affine::AffineReadOpInterface>(

     mlir::Operation *, affine::AffineReadOpInterface,

     llvm::function_ref<bool(Value, Value)>);


 // This attempts to find stores which have no impact on the final result.

 // A writing op writeA will be eliminated if there exists an op writeB if

 // 1) writeA and writeB have mathematically equivalent affine access functions.

 // 2) writeB postdominates writeA.

 // 3) There is no potential read between writeA and writeB.

 static void findUnusedStore(AffineWriteOpInterface writeA,

                             SmallVectorImpl<Operation *> &opsToErase,

                             PostDominanceInfo &postDominanceInfo,

                             llvm::function_ref<bool(Value, Value)> mayAlias) {


   for (Operation *user : writeA.getMemRef().getUsers()) {

     // Only consider writing operations.

     auto writeB = dyn_cast<AffineWriteOpInterface>(user);

     if (!writeB)

       continue;


     // The operations must be distinct.

     if (writeB == writeA)

       continue;


     // Both operations must lie in the same region.

     if (writeB->getParentRegion() != writeA->getParentRegion())

       continue;


     // Both operations must write to the same memory.

     MemRefAccess srcAccess(writeB);

     MemRefAccess destAccess(writeA);


     if (srcAccess != destAccess)

       continue;


     // writeB must postdominate writeA.

     if (!postDominanceInfo.postDominates(writeB, writeA))

       continue;


     // There cannot be an operation which reads from memory between

     // the two writes.

     if (!affine::hasNoInterveningEffect<MemoryEffects::Read>(writeA, writeB,

                                                              mayAlias))

       continue;


     opsToErase.push_back(writeA);

     break;

   }

 }


 // The load to load forwarding / redundant load elimination is similar to the

 // store to load forwarding.

 // loadA will be be replaced with loadB if:

 // 1) loadA and loadB have mathematically equivalent affine access functions.

 // 2) loadB dominates loadA.

 // 3) There is no write between loadA and loadB.

 static void loadCSE(AffineReadOpInterface loadA,

                     SmallVectorImpl<Operation *> &loadOpsToErase,

                     DominanceInfo &domInfo,

                     llvm::function_ref<bool(Value, Value)> mayAlias) {

   SmallVector<AffineReadOpInterface, 4> loadCandidates;

   for (auto *user : loadA.getMemRef().getUsers()) {

     auto loadB = dyn_cast<AffineReadOpInterface>(user);

     if (!loadB || loadB == loadA)

       continue;


     MemRefAccess srcAccess(loadB);

     MemRefAccess destAccess(loadA);


     // 1. The accesses should be to be to the same location.

     if (srcAccess != destAccess) {

       continue;

     }


     // 2. loadB should dominate loadA.

     if (!domInfo.dominates(loadB, loadA))

       continue;


     // 3. There should not be a write between loadA and loadB.

     if (!affine::hasNoInterveningEffect<MemoryEffects::Write>(

             loadB.getOperation(), loadA, mayAlias))

       continue;


     // Check if two values have the same shape. This is needed for affine vector

     // loads.

     if (loadB.getValue().getType() != loadA.getValue().getType())

       continue;


     loadCandidates.push_back(loadB);

   }


   // Of the legal load candidates, use the one that dominates all others

   // to minimize the subsequent need to loadCSE

   Value loadB;

   for (AffineReadOpInterface option : loadCandidates) {

     if (llvm::all_of(loadCandidates, [&](AffineReadOpInterface depStore) {

           return depStore == option ||

                  domInfo.dominates(option.getOperation(),

                                    depStore.getOperation());

         })) {

       loadB = option.getValue();

       break;

     }

   }


   if (loadB) {

     loadA.getValue().replaceAllUsesWith(loadB);

     // Record this to erase later.

     loadOpsToErase.push_back(loadA);

   }

 }


 // The store to load forwarding and load CSE rely on three conditions:

 //

 // 1) store/load providing a replacement value and load being replaced need to

 // have mathematically equivalent affine access functions (checked after full

 // composition of load/store operands); this implies that they access the same

 // single memref element for all iterations of the common surrounding loop,

 //

 // 2) the store/load op should dominate the load op,

 //

 // 3) no operation that may write to memory read by the load being replaced can

 // occur after executing the instruction (load or store) providing the

 // replacement value and before the load being replaced (thus potentially

 // allowing overwriting the memory read by the load).

 //

 // The above conditions are simple to check, sufficient, and powerful for most

 // cases in practice - they are sufficient, but not necessary --- since they

 // don't reason about loops that are guaranteed to execute at least once or

 // multiple sources to forward from.

 //

 // TODO: more forwarding can be done when support for

 // loop/conditional live-out SSA values is available.

 // TODO: do general dead store elimination for memref's. This pass

 // currently only eliminates the stores only if no other loads/uses (other

 // than dealloc) remain.

 //

 void mlir::affine::affineScalarReplace(func::FuncOp f, DominanceInfo &domInfo,

                                        PostDominanceInfo &postDomInfo,

                                        AliasAnalysis &aliasAnalysis) {

   // Load op's whose results were replaced by those forwarded from stores.

   SmallVector<Operation *, 8> opsToErase;


   // A list of memref's that are potentially dead / could be eliminated.

   SmallPtrSet<Value, 4> memrefsToErase;


   auto mayAlias = [&](Value val1, Value val2) -> bool {

     return !aliasAnalysis.alias(val1, val2).isNo();

   };


   // Walk all load's and perform store to load forwarding.

   f.walk([&](AffineReadOpInterface loadOp) {

     forwardStoreToLoad(loadOp, opsToErase, memrefsToErase, domInfo, mayAlias);

   });

   for (auto *op : opsToErase)

     op->erase();

   opsToErase.clear();


   // Walk all store's and perform unused store elimination

   f.walk([&](AffineWriteOpInterface storeOp) {

     findUnusedStore(storeOp, opsToErase, postDomInfo, mayAlias);

   });

   for (auto *op : opsToErase)

     op->erase();

   opsToErase.clear();


   // Check if the store fwd'ed memrefs are now left with only stores and

   // deallocs and can thus be completely deleted. Note: the canonicalize pass

   // should be able to do this as well, but we'll do it here since we collected

   // these anyway.

   for (auto memref : memrefsToErase) {

     // If the memref hasn't been locally alloc'ed, skip.

     Operation *defOp = memref.getDefiningOp();

     if (!defOp || !hasSingleEffect<MemoryEffects::Allocate>(defOp, memref))

       // TODO: if the memref was returned by a 'call' operation, we

       // could still erase it if the call had no side-effects.

       continue;

     if (llvm::any_of(memref.getUsers(), [&](Operation *ownerOp) {

           return !isa<AffineWriteOpInterface>(ownerOp) &&

                  !hasSingleEffect<MemoryEffects::Free>(ownerOp, memref);

         }))

       continue;


     // Erase all stores, the dealloc, and the alloc on the memref.

     for (auto *user : llvm::make_early_inc_range(memref.getUsers()))

       user->erase();

     defOp->erase();

   }


   // To eliminate as many loads as possible, run load CSE after eliminating

   // stores. Otherwise, some stores are wrongly seen as having an intervening

   // effect.

   f.walk([&](AffineReadOpInterface loadOp) {

     loadCSE(loadOp, opsToErase, domInfo, mayAlias);

   });

   for (auto *op : opsToErase)

     op->erase();

 }


 // Checks if `op` is non dereferencing.

 // TODO: This hardcoded check will be removed once the right interface is added.

 static bool isDereferencingOp(Operation *op) {

   return isa<AffineMapAccessInterface, memref::LoadOp, memref::StoreOp>(op);

 }


 // Perform the replacement in `op`.

 LogicalResult mlir::affine::replaceAllMemRefUsesWith(

     Value oldMemRef, Value newMemRef, Operation *op,

     ArrayRef<Value> extraIndices, AffineMap indexRemap,

     ArrayRef<Value> extraOperands, ArrayRef<Value> symbolOperands,

     bool allowNonDereferencingOps) {

   unsigned newMemRefRank = cast<MemRefType>(newMemRef.getType()).getRank();

   (void)newMemRefRank; // unused in opt mode

   unsigned oldMemRefRank = cast<MemRefType>(oldMemRef.getType()).getRank();

   (void)oldMemRefRank; // unused in opt mode

   if (indexRemap) {

     assert(indexRemap.getNumSymbols() == symbolOperands.size() &&

            "symbolic operand count mismatch");

     assert(indexRemap.getNumInputs() ==

            extraOperands.size() + oldMemRefRank + symbolOperands.size());

     assert(indexRemap.getNumResults() + extraIndices.size() == newMemRefRank);

   } else {

     assert(oldMemRefRank + extraIndices.size() == newMemRefRank);

   }


   // Assert same elemental type.

   assert(cast<MemRefType>(oldMemRef.getType()).getElementType() ==

          cast<MemRefType>(newMemRef.getType()).getElementType());


   SmallVector<unsigned, 2> usePositions;

   for (const auto &opEntry : llvm::enumerate(op->getOperands())) {

     if (opEntry.value() == oldMemRef)

       usePositions.push_back(opEntry.index());

   }


   // If memref doesn't appear, nothing to do.

   if (usePositions.empty())

     return success();


   unsigned memRefOperandPos = usePositions.front();


   OpBuilder builder(op);

   // The following checks if op is dereferencing memref and performs the access

   // index rewrites.

   if (!isDereferencingOp(op)) {

     if (!allowNonDereferencingOps) {

       // Failure: memref used in a non-dereferencing context (potentially

       // escapes); no replacement in these cases unless allowNonDereferencingOps

       // is set.

       return failure();

     }

     for (unsigned pos : usePositions)

       op->setOperand(pos, newMemRef);

     return success();

   }


   if (usePositions.size() > 1) {

     // TODO: extend it for this case when needed (rare).

     LLVM_DEBUG(llvm::dbgs()

                << "multiple dereferencing uses in a single op not supported");

     return failure();

   }


   // Perform index rewrites for the dereferencing op and then replace the op.

   SmallVector<Value, 4> oldMapOperands;

   AffineMap oldMap;

   unsigned oldMemRefNumIndices = oldMemRefRank;

   auto startIdx = op->operand_begin() + memRefOperandPos + 1;

   auto affMapAccInterface = dyn_cast<AffineMapAccessInterface>(op);

   if (affMapAccInterface) {

     // If `op` implements AffineMapAccessInterface, we can get the indices by

     // quering the number of map operands from the operand list from a certain

     // offset (`memRefOperandPos` in this case).

     NamedAttribute oldMapAttrPair =

         affMapAccInterface.getAffineMapAttrForMemRef(oldMemRef);

     oldMap = cast<AffineMapAttr>(oldMapAttrPair.getValue()).getValue();

     oldMemRefNumIndices = oldMap.getNumInputs();

   }

   oldMapOperands.assign(startIdx, startIdx + oldMemRefNumIndices);


   // Apply 'oldMemRefOperands = oldMap(oldMapOperands)'.

   SmallVector<Value, 4> oldMemRefOperands;

   SmallVector<Value, 4> affineApplyOps;

   oldMemRefOperands.reserve(oldMemRefRank);

   if (affMapAccInterface &&

       oldMap != builder.getMultiDimIdentityMap(oldMap.getNumDims())) {

     for (auto resultExpr : oldMap.getResults()) {

       auto singleResMap = AffineMap::get(oldMap.getNumDims(),

                                          oldMap.getNumSymbols(), resultExpr);

       auto afOp = AffineApplyOp::create(builder, op->getLoc(), singleResMap,

                                         oldMapOperands);

       oldMemRefOperands.push_back(afOp);

       affineApplyOps.push_back(afOp);

     }

   } else {

     oldMemRefOperands.assign(oldMapOperands.begin(), oldMapOperands.end());

   }


   // Construct new indices as a remap of the old ones if a remapping has been

   // provided. The indices of a memref come right after it, i.e.,

   // at position memRefOperandPos + 1.

   SmallVector<Value, 4> remapOperands;

   remapOperands.reserve(extraOperands.size() + oldMemRefRank +

                         symbolOperands.size());

   remapOperands.append(extraOperands.begin(), extraOperands.end());

   remapOperands.append(oldMemRefOperands.begin(), oldMemRefOperands.end());

   remapOperands.append(symbolOperands.begin(), symbolOperands.end());


   SmallVector<Value, 4> remapOutputs;

   remapOutputs.reserve(oldMemRefRank);

   if (indexRemap &&

       indexRemap != builder.getMultiDimIdentityMap(indexRemap.getNumDims())) {

     // Remapped indices.

     for (auto resultExpr : indexRemap.getResults()) {

       auto singleResMap = AffineMap::get(

           indexRemap.getNumDims(), indexRemap.getNumSymbols(), resultExpr);

       auto afOp = AffineApplyOp::create(builder, op->getLoc(), singleResMap,

                                         remapOperands);

       remapOutputs.push_back(afOp);

       affineApplyOps.push_back(afOp);

     }

   } else {

     // No remapping specified.

     remapOutputs.assign(remapOperands.begin(), remapOperands.end());

   }

   SmallVector<Value, 4> newMapOperands;

   newMapOperands.reserve(newMemRefRank);


   // Prepend 'extraIndices' in 'newMapOperands'.

   for (Value extraIndex : extraIndices) {

     assert((isValidDim(extraIndex) || isValidSymbol(extraIndex)) &&

            "invalid memory op index");

     newMapOperands.push_back(extraIndex);

   }


   // Append 'remapOutputs' to 'newMapOperands'.

   newMapOperands.append(remapOutputs.begin(), remapOutputs.end());


   // Create new fully composed AffineMap for new op to be created.

   assert(newMapOperands.size() == newMemRefRank);

   auto newMap = builder.getMultiDimIdentityMap(newMemRefRank);

   fullyComposeAffineMapAndOperands(&newMap, &newMapOperands);

   newMap = simplifyAffineMap(newMap);

   canonicalizeMapAndOperands(&newMap, &newMapOperands);

   // Remove any affine.apply's that became dead as a result of composition.

   for (Value value : affineApplyOps)

     if (value.use_empty())

       value.getDefiningOp()->erase();


   OperationState state(op->getLoc(), op->getName());

   // Construct the new operation using this memref.

   state.operands.reserve(op->getNumOperands() + extraIndices.size());

   // Insert the non-memref operands.

   state.operands.append(op->operand_begin(),

                         op->operand_begin() + memRefOperandPos);

   // Insert the new memref value.

   state.operands.push_back(newMemRef);


   // Insert the new memref map operands.

   if (affMapAccInterface) {

     state.operands.append(newMapOperands.begin(), newMapOperands.end());

   } else {

     // In the case of dereferencing ops not implementing

     // AffineMapAccessInterface, we need to apply the values of `newMapOperands`

     // to the `newMap` to get the correct indices.

     for (unsigned i = 0; i < newMemRefRank; i++) {

       state.operands.push_back(AffineApplyOp::create(

           builder, op->getLoc(),

           AffineMap::get(newMap.getNumDims(), newMap.getNumSymbols(),

                          newMap.getResult(i)),

           newMapOperands));

     }

   }


   // Insert the remaining operands unmodified.

   unsigned oldMapNumInputs = oldMapOperands.size();

   state.operands.append(op->operand_begin() + memRefOperandPos + 1 +

                             oldMapNumInputs,

                         op->operand_end());

   // Result types don't change. Both memref's are of the same elemental type.

   state.types.reserve(op->getNumResults());

   for (auto result : op->getResults())

     state.types.push_back(result.getType());


   // Add attribute for 'newMap', other Attributes do not change.

   auto newMapAttr = AffineMapAttr::get(newMap);

   for (auto namedAttr : op->getAttrs()) {

     if (affMapAccInterface &&

         namedAttr.getName() ==

             affMapAccInterface.getAffineMapAttrForMemRef(oldMemRef).getName())

       state.attributes.push_back({namedAttr.getName(), newMapAttr});

     else

       state.attributes.push_back(namedAttr);

   }


   // Create the new operation.

   auto *repOp = builder.create(state);

   op->replaceAllUsesWith(repOp);

   op->erase();


   return success();

 }


 LogicalResult mlir::affine::replaceAllMemRefUsesWith(

     Value oldMemRef, Value newMemRef, ArrayRef<Value> extraIndices,

     AffineMap indexRemap, ArrayRef<Value> extraOperands,

     ArrayRef<Value> symbolOperands,

     llvm::function_ref<bool(Operation *)> userFilterFn,

     bool allowNonDereferencingOps, bool replaceInDeallocOp) {

   unsigned newMemRefRank = cast<MemRefType>(newMemRef.getType()).getRank();

   (void)newMemRefRank; // unused in opt mode

   unsigned oldMemRefRank = cast<MemRefType>(oldMemRef.getType()).getRank();

   (void)oldMemRefRank;

   if (indexRemap) {

     assert(indexRemap.getNumSymbols() == symbolOperands.size() &&

            "symbol operand count mismatch");

     assert(indexRemap.getNumInputs() ==

            extraOperands.size() + oldMemRefRank + symbolOperands.size());

     assert(indexRemap.getNumResults() + extraIndices.size() == newMemRefRank);

   } else {

     assert(oldMemRefRank + extraIndices.size() == newMemRefRank);

   }


   // Assert same elemental type.

   assert(cast<MemRefType>(oldMemRef.getType()).getElementType() ==

          cast<MemRefType>(newMemRef.getType()).getElementType());


   std::unique_ptr<DominanceInfo> domInfo;

   std::unique_ptr<PostDominanceInfo> postDomInfo;


   // Walk all uses of old memref; collect ops to perform replacement. We use a

   // DenseSet since an operation could potentially have multiple uses of a

   // memref (although rare), and the replacement later is going to erase ops.

   DenseSet<Operation *> opsToReplace;

   for (auto *user : oldMemRef.getUsers()) {

     // Check if this user doesn't pass the filter.

     if (userFilterFn && !userFilterFn(user))

       continue;


     // Skip dealloc's - no replacement is necessary, and a memref replacement

     // at other uses doesn't hurt these dealloc's.

     if (hasSingleEffect<MemoryEffects::Free>(user, oldMemRef) &&

         !replaceInDeallocOp)

       continue;


     // Check if the memref was used in a non-dereferencing context. It is fine

     // for the memref to be used in a non-dereferencing way outside of the

     // region where this replacement is happening.

     if (!isa<AffineMapAccessInterface>(*user)) {

       if (!allowNonDereferencingOps) {

         LLVM_DEBUG(

             llvm::dbgs()

             << "Memref replacement failed: non-deferencing memref user: \n"

             << *user << '\n');

         return failure();

       }

       // Non-dereferencing ops with the MemRefsNormalizable trait are

       // supported for replacement.

       if (!user->hasTrait<OpTrait::MemRefsNormalizable>()) {

         LLVM_DEBUG(llvm::dbgs() << "Memref replacement failed: use without a "

                                    "memrefs normalizable trait: \n"

                                 << *user << '\n');

         return failure();

       }

     }


     // We'll first collect and then replace --- since replacement erases the

     // user that has the use, and that user could be postDomFilter or domFilter

     // itself!

     opsToReplace.insert(user);

   }


   for (auto *user : opsToReplace) {

     if (failed(replaceAllMemRefUsesWith(

             oldMemRef, newMemRef, user, extraIndices, indexRemap, extraOperands,

             symbolOperands, allowNonDereferencingOps)))

       llvm_unreachable("memref replacement guaranteed to succeed here");

   }


   return success();

 }


 /// Given an operation, inserts one or more single result affine

 /// apply operations, results of which are exclusively used by this operation

 /// operation. The operands of these newly created affine apply ops are

 /// guaranteed to be loop iterators or terminal symbols of a function.

 ///

 /// Before

 ///

 /// affine.for %i = 0 to #map(%N)

 ///   %idx = affine.apply (d0) -> (d0 mod 2) (%i)

 ///   "send"(%idx, %A, ...)

 ///   "compute"(%idx)

 ///

 /// After

 ///

 /// affine.for %i = 0 to #map(%N)

 ///   %idx = affine.apply (d0) -> (d0 mod 2) (%i)

 ///   "send"(%idx, %A, ...)

 ///   %idx_ = affine.apply (d0) -> (d0 mod 2) (%i)

 ///   "compute"(%idx_)

 ///

 /// This allows applying different transformations on send and compute (for eg.

 /// different shifts/delays).

 ///

 /// Returns nullptr either if none of opInst's operands were the result of an

 /// affine.apply and thus there was no affine computation slice to create, or if

 /// all the affine.apply op's supplying operands to this opInst did not have any

 /// uses besides this opInst; otherwise returns the list of affine.apply

 /// operations created in output argument `sliceOps`.

 void mlir::affine::createAffineComputationSlice(

     Operation *opInst, SmallVectorImpl<AffineApplyOp> *sliceOps) {

   // Collect all operands that are results of affine apply ops.

   SmallVector<Value, 4> subOperands;

   subOperands.reserve(opInst->getNumOperands());

   for (auto operand : opInst->getOperands())

     if (isa_and_nonnull<AffineApplyOp>(operand.getDefiningOp()))

       subOperands.push_back(operand);


   // Gather sequence of AffineApplyOps reachable from 'subOperands'.

   SmallVector<Operation *, 4> affineApplyOps;

   getReachableAffineApplyOps(subOperands, affineApplyOps);

   // Skip transforming if there are no affine maps to compose.

   if (affineApplyOps.empty())

     return;


   // Check if all uses of the affine apply op's lie only in this op op, in

   // which case there would be nothing to do.

   bool localized = true;

   for (auto *op : affineApplyOps) {

     for (auto result : op->getResults()) {

       for (auto *user : result.getUsers()) {

         if (user != opInst) {

           localized = false;

           break;

         }

       }

     }

   }

   if (localized)

     return;


   OpBuilder builder(opInst);

   SmallVector<Value, 4> composedOpOperands(subOperands);

   auto composedMap = builder.getMultiDimIdentityMap(composedOpOperands.size());

   fullyComposeAffineMapAndOperands(&composedMap, &composedOpOperands);


   // Create an affine.apply for each of the map results.

   sliceOps->reserve(composedMap.getNumResults());

   for (auto resultExpr : composedMap.getResults()) {

     auto singleResMap = AffineMap::get(composedMap.getNumDims(),

                                        composedMap.getNumSymbols(), resultExpr);

     sliceOps->push_back(AffineApplyOp::create(

         builder, opInst->getLoc(), singleResMap, composedOpOperands));

   }


   // Construct the new operands that include the results from the composed

   // affine apply op above instead of existing ones (subOperands). So, they

   // differ from opInst's operands only for those operands in 'subOperands', for

   // which they will be replaced by the corresponding one from 'sliceOps'.

   SmallVector<Value, 4> newOperands(opInst->getOperands());

   for (Value &operand : newOperands) {

     // Replace the subOperands from among the new operands.

     unsigned j, f;

     for (j = 0, f = subOperands.size(); j < f; j++) {

       if (operand == subOperands[j])

         break;

     }

     if (j < subOperands.size())

       operand = (*sliceOps)[j];

   }

   for (unsigned idx = 0, e = newOperands.size(); idx < e; idx++)

     opInst->setOperand(idx, newOperands[idx]);

 }


 /// Enum to set patterns of affine expr in tiled-layout map.

 /// TileFloorDiv: <dim expr> div <tile size>

 /// TileMod: <dim expr> mod <tile size>

 /// TileNone: None of the above

 /// Example:

 /// #tiled_2d_128x256 = affine_map<(d0, d1)

 ///            -> (d0 div 128, d1 div 256, d0 mod 128, d1 mod 256)>

 /// "d0 div 128" and "d1 div 256" ==> TileFloorDiv

 /// "d0 mod 128" and "d1 mod 256" ==> TileMod

 enum TileExprPattern { TileFloorDiv, TileMod, TileNone };


 /// Check if `map` is a tiled layout. In the tiled layout, specific k dimensions

 /// being floordiv'ed by respective tile sizes appeare in a mod with the same

 /// tile sizes, and no other expression involves those k dimensions. This

 /// function stores a vector of tuples (`tileSizePos`) including AffineExpr for

 /// tile size, positions of corresponding `floordiv` and `mod`. If it is not a

 /// tiled layout, an empty vector is returned.

 static LogicalResult getTileSizePos(

     AffineMap map,

     SmallVectorImpl<std::tuple<AffineExpr, unsigned, unsigned>> &tileSizePos) {

   // Create `floordivExprs` which is a vector of tuples including LHS and RHS of

   // `floordiv` and its position in `map` output.

   // Example: #tiled_2d_128x256 = affine_map<(d0, d1)

   //                -> (d0 div 128, d1 div 256, d0 mod 128, d1 mod 256)>

   // In this example, `floordivExprs` includes {d0, 128, 0} and {d1, 256, 1}.

   SmallVector<std::tuple<AffineExpr, AffineExpr, unsigned>, 4> floordivExprs;

   unsigned pos = 0;

   for (AffineExpr expr : map.getResults()) {

     if (expr.getKind() == AffineExprKind::FloorDiv) {

       AffineBinaryOpExpr binaryExpr = cast<AffineBinaryOpExpr>(expr);

       if (isa<AffineConstantExpr>(binaryExpr.getRHS()))

         floordivExprs.emplace_back(

             std::make_tuple(binaryExpr.getLHS(), binaryExpr.getRHS(), pos));

     }

     pos++;

   }

   // Not tiled layout if `floordivExprs` is empty.

   if (floordivExprs.empty()) {

     tileSizePos = SmallVector<std::tuple<AffineExpr, unsigned, unsigned>>{};

     return success();

   }


   // Check if LHS of `floordiv` is used in LHS of `mod`. If not used, `map` is

   // not tiled layout.

   for (std::tuple<AffineExpr, AffineExpr, unsigned> fexpr : floordivExprs) {

     AffineExpr floordivExprLHS = std::get<0>(fexpr);

     AffineExpr floordivExprRHS = std::get<1>(fexpr);

     unsigned floordivPos = std::get<2>(fexpr);


     // Walk affinexpr of `map` output except `fexpr`, and check if LHS and RHS

     // of `fexpr` are used in LHS and RHS of `mod`. If LHS of `fexpr` is used

     // other expr, the map is not tiled layout. Example of non tiled layout:

     //   affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2 floordiv 256)>

     //   affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2 mod 128)>

     //   affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2 mod 256, d2 mod

     //   256)>

     bool found = false;

     pos = 0;

     for (AffineExpr expr : map.getResults()) {

       bool notTiled = false;

       if (pos != floordivPos) {

         expr.walk([&](AffineExpr e) {

           if (e == floordivExprLHS) {

             if (expr.getKind() == AffineExprKind::Mod) {

               AffineBinaryOpExpr binaryExpr = cast<AffineBinaryOpExpr>(expr);

               // If LHS and RHS of `mod` are the same with those of floordiv.

               if (floordivExprLHS == binaryExpr.getLHS() &&

                   floordivExprRHS == binaryExpr.getRHS()) {

                 // Save tile size (RHS of `mod`), and position of `floordiv` and

                 // `mod` if same expr with `mod` is not found yet.

                 if (!found) {

                   tileSizePos.emplace_back(

                       std::make_tuple(binaryExpr.getRHS(), floordivPos, pos));

                   found = true;

                 } else {

                   // Non tiled layout: Have multilpe `mod` with the same LHS.

                   // eg. affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2

                   // mod 256, d2 mod 256)>

                   notTiled = true;

                 }

               } else {

                 // Non tiled layout: RHS of `mod` is different from `floordiv`.

                 // eg. affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2

                 // mod 128)>

                 notTiled = true;

               }

             } else {

               // Non tiled layout: LHS is the same, but not `mod`.

               // eg. affine_map<(d0, d1, d2) -> (d0, d1, d2 floordiv 256, d2

               // floordiv 256)>

               notTiled = true;

             }

           }

         });

       }

       if (notTiled) {

         tileSizePos = SmallVector<std::tuple<AffineExpr, unsigned, unsigned>>{};

         return success();

       }

       pos++;

     }

   }

   return success();

 }


 /// Check if `dim` dimension of memrefType with `layoutMap` becomes dynamic

 /// after normalization. Dimensions that include dynamic dimensions in the map

 /// output will become dynamic dimensions. Return true if `dim` is dynamic

 /// dimension.

 ///

 /// Example:

 /// #map0 = affine_map<(d0, d1) -> (d0, d1 floordiv 32, d1 mod 32)>

 ///

 /// If d1 is dynamic dimension, 2nd and 3rd dimension of map output are dynamic.

 /// memref<4x?xf32, #map0>  ==>  memref<4x?x?xf32>

 static bool

 isNormalizedMemRefDynamicDim(unsigned dim, AffineMap layoutMap,

                              SmallVectorImpl<unsigned> &inMemrefTypeDynDims) {

   AffineExpr expr = layoutMap.getResults()[dim];

   // Check if affine expr of the dimension includes dynamic dimension of input

   // memrefType.

   MLIRContext *context = layoutMap.getContext();

   return expr

       .walk([&](AffineExpr e) {

         if (isa<AffineDimExpr>(e) &&

             llvm::any_of(inMemrefTypeDynDims, [&](unsigned dim) {

               return e == getAffineDimExpr(dim, context);

             }))

           return WalkResult::interrupt();

         return WalkResult::advance();

       })

       .wasInterrupted();

 }


 /// Create affine expr to calculate dimension size for a tiled-layout map.

 static AffineExpr createDimSizeExprForTiledLayout(AffineExpr oldMapOutput,

                                                   TileExprPattern pat) {

   // Create map output for the patterns.

   // "floordiv <tile size>" ==> "ceildiv <tile size>"

   // "mod <tile size>" ==> "<tile size>"

   AffineExpr newMapOutput;

   AffineBinaryOpExpr binaryExpr = nullptr;

   switch (pat) {

   case TileExprPattern::TileMod:

     binaryExpr = cast<AffineBinaryOpExpr>(oldMapOutput);

     newMapOutput = binaryExpr.getRHS();

     break;

   case TileExprPattern::TileFloorDiv:

     binaryExpr = cast<AffineBinaryOpExpr>(oldMapOutput);

     newMapOutput = getAffineBinaryOpExpr(

         AffineExprKind::CeilDiv, binaryExpr.getLHS(), binaryExpr.getRHS());

     break;

   default:

     newMapOutput = oldMapOutput;

   }

   return newMapOutput;

 }


 /// Create new maps to calculate each dimension size of `newMemRefType`, and

 /// create `newDynamicSizes` from them by using AffineApplyOp.

 ///

 /// Steps for normalizing dynamic memrefs for a tiled layout map

 /// Example:

 ///    #map0 = affine_map<(d0, d1) -> (d0, d1 floordiv 32, d1 mod 32)>

 ///    %0 = dim %arg0, %c1 :memref<4x?xf32>

 ///    %1 = alloc(%0) : memref<4x?xf32, #map0>

 ///

 /// (Before this function)

 /// 1. Check if `map`(#map0) is a tiled layout using `getTileSizePos()`. Only

 /// single layout map is supported.

 ///

 /// 2. Create normalized memrefType using `isNormalizedMemRefDynamicDim()`. It

 /// is memref<4x?x?xf32> in the above example.

 ///

 /// (In this function)

 /// 3. Create new maps to calculate each dimension of the normalized memrefType

 /// using `createDimSizeExprForTiledLayout()`. In the tiled layout, the

 /// dimension size can be calculated by replacing "floordiv <tile size>" with

 /// "ceildiv <tile size>" and "mod <tile size>" with "<tile size>".

 /// - New map in the above example

 ///   #map0 = affine_map<(d0, d1) -> (d0)>

 ///   #map1 = affine_map<(d0, d1) -> (d1 ceildiv 32)>

 ///   #map2 = affine_map<(d0, d1) -> (32)>

 ///

 /// 4. Create AffineApplyOp to apply the new maps. The output of AffineApplyOp

 /// is used in dynamicSizes of new AllocOp.

 ///   %0 = dim %arg0, %c1 : memref<4x?xf32>

 ///   %c4 = arith.constant 4 : index

 ///   %1 = affine.apply #map1(%c4, %0)

 ///   %2 = affine.apply #map2(%c4, %0)

 template <typename AllocLikeOp>

 static void createNewDynamicSizes(MemRefType oldMemRefType,

                                   MemRefType newMemRefType, AffineMap map,

                                   AllocLikeOp allocOp, OpBuilder b,

                                   SmallVectorImpl<Value> &newDynamicSizes) {

   // Create new input for AffineApplyOp.

   SmallVector<Value, 4> inAffineApply;

   ArrayRef<int64_t> oldMemRefShape = oldMemRefType.getShape();

   unsigned dynIdx = 0;

   for (unsigned d = 0; d < oldMemRefType.getRank(); ++d) {

     if (oldMemRefShape[d] < 0) {

       // Use dynamicSizes of allocOp for dynamic dimension.

       inAffineApply.emplace_back(allocOp.getDynamicSizes()[dynIdx]);

       dynIdx++;

     } else {

       // Create ConstantOp for static dimension.

       auto constantAttr = b.getIntegerAttr(b.getIndexType(), oldMemRefShape[d]);

       inAffineApply.emplace_back(

           arith::ConstantOp::create(b, allocOp.getLoc(), constantAttr));

     }

   }


   // Create new map to calculate each dimension size of new memref for each

   // original map output. Only for dynamic dimesion of `newMemRefType`.

   unsigned newDimIdx = 0;

   ArrayRef<int64_t> newMemRefShape = newMemRefType.getShape();

   SmallVector<std::tuple<AffineExpr, unsigned, unsigned>> tileSizePos;

   (void)getTileSizePos(map, tileSizePos);

   for (AffineExpr expr : map.getResults()) {

     if (newMemRefShape[newDimIdx] < 0) {

       // Create new maps to calculate each dimension size of new memref.

       enum TileExprPattern pat = TileExprPattern::TileNone;

       for (auto pos : tileSizePos) {

         if (newDimIdx == std::get<1>(pos))

           pat = TileExprPattern::TileFloorDiv;

         else if (newDimIdx == std::get<2>(pos))

           pat = TileExprPattern::TileMod;

       }

       AffineExpr newMapOutput = createDimSizeExprForTiledLayout(expr, pat);

       AffineMap newMap =

           AffineMap::get(map.getNumInputs(), map.getNumSymbols(), newMapOutput);

       Value affineApp =

           AffineApplyOp::create(b, allocOp.getLoc(), newMap, inAffineApply);

       newDynamicSizes.emplace_back(affineApp);

     }

     newDimIdx++;

   }

 }


 template <typename AllocLikeOp>

 LogicalResult mlir::affine::normalizeMemRef(AllocLikeOp allocOp) {

   MemRefType memrefType = allocOp.getType();

   OpBuilder b(allocOp);


   // Fetch a new memref type after normalizing the old memref to have an

   // identity map layout.

   MemRefType newMemRefType = normalizeMemRefType(memrefType);

   if (newMemRefType == memrefType)

     // Either memrefType already had an identity map or the map couldn't be

     // transformed to an identity map.

     return failure();


   Value oldMemRef = allocOp.getResult();


   SmallVector<Value, 4> symbolOperands(allocOp.getSymbolOperands());

   AffineMap layoutMap = memrefType.getLayout().getAffineMap();

   AllocLikeOp newAlloc;

   // Check if `layoutMap` is a tiled layout. Only single layout map is

   // supported for normalizing dynamic memrefs.

   SmallVector<std::tuple<AffineExpr, unsigned, unsigned>> tileSizePos;

   (void)getTileSizePos(layoutMap, tileSizePos);

   if (newMemRefType.getNumDynamicDims() > 0 && !tileSizePos.empty()) {

     auto oldMemRefType = cast<MemRefType>(oldMemRef.getType());

     SmallVector<Value, 4> newDynamicSizes;

     createNewDynamicSizes(oldMemRefType, newMemRefType, layoutMap, allocOp, b,

                           newDynamicSizes);

     // Add the new dynamic sizes in new AllocOp.

     newAlloc = AllocLikeOp::create(b, allocOp.getLoc(), newMemRefType,

                                    newDynamicSizes, allocOp.getAlignmentAttr());

   } else {

     newAlloc = AllocLikeOp::create(b, allocOp.getLoc(), newMemRefType,

                                    allocOp.getAlignmentAttr());

   }

   // Replace all uses of the old memref.

   if (failed(replaceAllMemRefUsesWith(oldMemRef, /*newMemRef=*/newAlloc,

                                       /*extraIndices=*/{},

                                       /*indexRemap=*/layoutMap,

                                       /*extraOperands=*/{},

                                       /*symbolOperands=*/symbolOperands,

                                       /*userFilterFn=*/nullptr,

                                       /*allowNonDereferencingOps=*/true))) {

     // If it failed (due to escapes for example), bail out.

     newAlloc.erase();

     return failure();

   }

   // Replace any uses of the original alloc op and erase it. All remaining uses

   // have to be dealloc's; RAMUW above would've failed otherwise.

   assert(llvm::all_of(oldMemRef.getUsers(), [&](Operation *op) {

     return hasSingleEffect<MemoryEffects::Free>(op, oldMemRef);

   }));

   oldMemRef.replaceAllUsesWith(newAlloc);

   allocOp.erase();

   return success();

 }


 LogicalResult

 mlir::affine::normalizeMemRef(memref::ReinterpretCastOp reinterpretCastOp) {

   MemRefType memrefType = reinterpretCastOp.getType();

   AffineMap oldLayoutMap = memrefType.getLayout().getAffineMap();

   Value oldMemRef = reinterpretCastOp.getResult();


   // If `oldLayoutMap` is identity, `memrefType` is already normalized.

   if (oldLayoutMap.isIdentity())

     return success();


   // Fetch a new memref type after normalizing the old memref to have an

   // identity map layout.

   MemRefType newMemRefType = normalizeMemRefType(memrefType);

   if (newMemRefType == memrefType)

     // `oldLayoutMap` couldn't be transformed to an identity map.

     return failure();


   uint64_t newRank = newMemRefType.getRank();

   SmallVector<Value> mapOperands(oldLayoutMap.getNumDims() +

                                  oldLayoutMap.getNumSymbols());

   SmallVector<Value> oldStrides = reinterpretCastOp.getStrides();

   Location loc = reinterpretCastOp.getLoc();

   // As `newMemRefType` is normalized, it is unit strided.

   SmallVector<int64_t> newStaticStrides(newRank, 1);

   SmallVector<int64_t> newStaticOffsets(newRank, 0);

   ArrayRef<int64_t> oldShape = memrefType.getShape();

   ValueRange oldSizes = reinterpretCastOp.getSizes();

   unsigned idx = 0;

   OpBuilder b(reinterpretCastOp);

   // Collect the map operands which will be used to compute the new normalized

   // memref shape.

   for (unsigned i = 0, e = memrefType.getRank(); i < e; i++) {

     if (memrefType.isDynamicDim(i))

       mapOperands[i] =

           arith::SubIOp::create(b, loc, oldSizes[0].getType(), oldSizes[idx++],

                                 arith::ConstantIndexOp::create(b, loc, 1));

     else

       mapOperands[i] = arith::ConstantIndexOp::create(b, loc, oldShape[i] - 1);

   }

   for (unsigned i = 0, e = oldStrides.size(); i < e; i++)

     mapOperands[memrefType.getRank() + i] = oldStrides[i];

   SmallVector<Value> newSizes;

   ArrayRef<int64_t> newShape = newMemRefType.getShape();

   // Compute size along all the dimensions of the new normalized memref.

   for (unsigned i = 0; i < newRank; i++) {

     if (!newMemRefType.isDynamicDim(i))

       continue;

     newSizes.push_back(AffineApplyOp::create(

         b, loc,

         AffineMap::get(oldLayoutMap.getNumDims(), oldLayoutMap.getNumSymbols(),

                        oldLayoutMap.getResult(i)),

         mapOperands));

   }

   for (unsigned i = 0, e = newSizes.size(); i < e; i++) {

     newSizes[i] =

         arith::AddIOp::create(b, loc, newSizes[i].getType(), newSizes[i],

                               arith::ConstantIndexOp::create(b, loc, 1));

   }

   // Create the new reinterpret_cast op.

   auto newReinterpretCast = memref::ReinterpretCastOp::create(

       b, loc, newMemRefType, reinterpretCastOp.getSource(),

       /*offsets=*/ValueRange(), newSizes,

       /*strides=*/ValueRange(),

       /*static_offsets=*/newStaticOffsets,

       /*static_sizes=*/newShape,

       /*static_strides=*/newStaticStrides);


   // Replace all uses of the old memref.

   if (failed(replaceAllMemRefUsesWith(oldMemRef,

                                       /*newMemRef=*/newReinterpretCast,

                                       /*extraIndices=*/{},

                                       /*indexRemap=*/oldLayoutMap,

                                       /*extraOperands=*/{},

                                       /*symbolOperands=*/oldStrides,

                                       /*userFilterFn=*/nullptr,

                                       /*allowNonDereferencingOps=*/true))) {

     // If it failed (due to escapes for example), bail out.

     newReinterpretCast.erase();

     return failure();

   }


   oldMemRef.replaceAllUsesWith(newReinterpretCast);

   reinterpretCastOp.erase();

   return success();

 }


 template LogicalResult

 mlir::affine::normalizeMemRef<memref::AllocaOp>(memref::AllocaOp op);

 template LogicalResult

 mlir::affine::normalizeMemRef<memref::AllocOp>(memref::AllocOp op);


 MemRefType mlir::affine::normalizeMemRefType(MemRefType memrefType) {

   unsigned rank = memrefType.getRank();

   if (rank == 0)

     return memrefType;


   if (memrefType.getLayout().isIdentity()) {

     // Either no maps is associated with this memref or this memref has

     // a trivial (identity) map.

     return memrefType;

   }

   AffineMap layoutMap = memrefType.getLayout().getAffineMap();

   unsigned numSymbolicOperands = layoutMap.getNumSymbols();


   // We don't do any checks for one-to-one'ness; we assume that it is

   // one-to-one.


   // Normalize only static memrefs and dynamic memrefs with a tiled-layout map

   // for now.

   // TODO: Normalize the other types of dynamic memrefs.

   SmallVector<std::tuple<AffineExpr, unsigned, unsigned>> tileSizePos;

   (void)getTileSizePos(layoutMap, tileSizePos);

   if (memrefType.getNumDynamicDims() > 0 && tileSizePos.empty())

     return memrefType;


   // We have a single map that is not an identity map. Create a new memref

   // with the right shape and an identity layout map.

   ArrayRef<int64_t> shape = memrefType.getShape();

   // FlatAffineValueConstraint may later on use symbolicOperands.

   FlatAffineValueConstraints fac(rank, numSymbolicOperands);

   SmallVector<unsigned, 4> memrefTypeDynDims;

   for (unsigned d = 0; d < rank; ++d) {

     // Use constraint system only in static dimensions.

     if (shape[d] > 0) {

       fac.addBound(BoundType::LB, d, 0);

       fac.addBound(BoundType::UB, d, shape[d] - 1);

     } else {

       memrefTypeDynDims.emplace_back(d);

     }

   }

   // We compose this map with the original index (logical) space to derive

   // the upper bounds for the new index space.

   unsigned newRank = layoutMap.getNumResults();

   if (failed(fac.composeMatchingMap(layoutMap)))

     return memrefType;

   // TODO: Handle semi-affine maps.

   // Project out the old data dimensions.

   fac.projectOut(newRank, fac.getNumVars() - newRank - fac.getNumLocalVars());

   SmallVector<int64_t, 4> newShape(newRank);

   MLIRContext *context = memrefType.getContext();

   for (unsigned d = 0; d < newRank; ++d) {

     // Check if this dimension is dynamic.

     if (isNormalizedMemRefDynamicDim(d, layoutMap, memrefTypeDynDims)) {

       newShape[d] = ShapedType::kDynamic;

       continue;

     }

     // The lower bound for the shape is always zero.

     std::optional<int64_t> ubConst = fac.getConstantBound64(BoundType::UB, d);

     // For a static memref and an affine map with no symbols, this is

     // always bounded. However, when we have symbols, we may not be able to

     // obtain a constant upper bound. Also, mapping to a negative space is

     // invalid for normalization.

     if (!ubConst.has_value() || *ubConst < 0) {

       LLVM_DEBUG(llvm::dbgs()

                  << "can't normalize map due to unknown/invalid upper bound");

       return memrefType;

     }

     // If dimension of new memrefType is dynamic, the value is -1.

     newShape[d] = *ubConst + 1;

   }


   // Create the new memref type after trivializing the old layout map.

   auto newMemRefType =

       MemRefType::Builder(memrefType)

           .setShape(newShape)

           .setLayout(AffineMapAttr::get(

               AffineMap::getMultiDimIdentityMap(newRank, context)));

   return newMemRefType;

 }


 DivModValue mlir::affine::getDivMod(OpBuilder &b, Location loc, Value lhs,

                                     Value rhs) {

   DivModValue result;

   AffineExpr d0, d1;

   bindDims(b.getContext(), d0, d1);

   result.quotient =

       affine::makeComposedAffineApply(b, loc, d0.floorDiv(d1), {lhs, rhs});

   result.remainder =

       affine::makeComposedAffineApply(b, loc, d0 % d1, {lhs, rhs});

   return result;

 }


 /// Create an affine map that computes `lhs` * `rhs`, composing in any other

 /// affine maps.

 static FailureOr<OpFoldResult> composedAffineMultiply(OpBuilder &b,

                                                       Location loc,

                                                       OpFoldResult lhs,

                                                       OpFoldResult rhs) {

   AffineExpr s0, s1;

   bindSymbols(b.getContext(), s0, s1);

   return makeComposedFoldedAffineApply(b, loc, s0 * s1, {lhs, rhs});

 }


 FailureOr<SmallVector<Value>>

 mlir::affine::delinearizeIndex(OpBuilder &b, Location loc, Value linearIndex,

                                ArrayRef<Value> basis, bool hasOuterBound) {

   if (hasOuterBound)

     basis = basis.drop_front();


   // Note: the divisors are backwards due to the scan.

   SmallVector<Value> divisors;

   OpFoldResult basisProd = b.getIndexAttr(1);

   for (OpFoldResult basisElem : llvm::reverse(basis)) {

     FailureOr<OpFoldResult> nextProd =

         composedAffineMultiply(b, loc, basisElem, basisProd);

     if (failed(nextProd))

       return failure();

     basisProd = *nextProd;

     divisors.push_back(getValueOrCreateConstantIndexOp(b, loc, basisProd));

   }


   SmallVector<Value> results;

   results.reserve(divisors.size() + 1);

   Value residual = linearIndex;

   for (Value divisor : llvm::reverse(divisors)) {

     DivModValue divMod = getDivMod(b, loc, residual, divisor);

     results.push_back(divMod.quotient);

     residual = divMod.remainder;

   }

   results.push_back(residual);

   return results;

 }


 FailureOr<SmallVector<Value>>

 mlir::affine::delinearizeIndex(OpBuilder &b, Location loc, Value linearIndex,

                                ArrayRef<OpFoldResult> basis,

                                bool hasOuterBound) {

   if (hasOuterBound)

     basis = basis.drop_front();


   // Note: the divisors are backwards due to the scan.

   SmallVector<Value> divisors;

   OpFoldResult basisProd = b.getIndexAttr(1);

   for (OpFoldResult basisElem : llvm::reverse(basis)) {

     FailureOr<OpFoldResult> nextProd =

         composedAffineMultiply(b, loc, basisElem, basisProd);

     if (failed(nextProd))

       return failure();

     basisProd = *nextProd;

     divisors.push_back(getValueOrCreateConstantIndexOp(b, loc, basisProd));

   }


   SmallVector<Value> results;

   results.reserve(divisors.size() + 1);

   Value residual = linearIndex;

   for (Value divisor : llvm::reverse(divisors)) {

     DivModValue divMod = getDivMod(b, loc, residual, divisor);

     results.push_back(divMod.quotient);

     residual = divMod.remainder;

   }

   results.push_back(residual);

   return results;

 }


 OpFoldResult mlir::affine::linearizeIndex(ArrayRef<OpFoldResult> multiIndex,

                                           ArrayRef<OpFoldResult> basis,

                                           ImplicitLocOpBuilder &builder) {

   return linearizeIndex(builder, builder.getLoc(), multiIndex, basis);

 }


 OpFoldResult mlir::affine::linearizeIndex(OpBuilder &builder, Location loc,

                                           ArrayRef<OpFoldResult> multiIndex,

                                           ArrayRef<OpFoldResult> basis) {

   assert(multiIndex.size() == basis.size() ||

          multiIndex.size() == basis.size() + 1);

   SmallVector<AffineExpr> basisAffine;


   // Add a fake initial size in order to make the later index linearization

   // computations line up if an outer bound is not provided.

   if (multiIndex.size() == basis.size() + 1)

     basisAffine.push_back(getAffineConstantExpr(1, builder.getContext()));


   for (size_t i = 0; i < basis.size(); ++i) {

     basisAffine.push_back(getAffineSymbolExpr(i, builder.getContext()));

   }


   SmallVector<AffineExpr> stridesAffine = computeStrides(basisAffine);

   SmallVector<OpFoldResult> strides;

   strides.reserve(stridesAffine.size());

   llvm::transform(stridesAffine, std::back_inserter(strides),

                   [&builder, &basis, loc](AffineExpr strideExpr) {

                     return affine::makeComposedFoldedAffineApply(

                         builder, loc, strideExpr, basis);

                   });


   auto &&[linearIndexExpr, multiIndexAndStrides] = computeLinearIndex(

       OpFoldResult(builder.getIndexAttr(0)), strides, multiIndex);

   return affine::makeComposedFoldedAffineApply(builder, loc, linearIndexExpr,

                                                multiIndexAndStrides);

 }

AffineExprVisitor.h

AffineOps.h

AffineValueMap.h

Utils.h

mayHaveEffect
static bool mayHaveEffect(Operation *srcMemOp, Operation *destMemOp, unsigned minSurroundingLoops)
Returns true if srcMemOp may have an effect on destMemOp within the scope of the outermost minSurroun...
Definition: Utils.cpp:654

createNewDynamicSizes
static void createNewDynamicSizes(MemRefType oldMemRefType, MemRefType newMemRefType, AffineMap map, AllocLikeOp allocOp, OpBuilder b, SmallVectorImpl< Value > &newDynamicSizes)
Create new maps to calculate each dimension size of newMemRefType, and create newDynamicSizes from th...
Definition: Utils.cpp:1669

isDereferencingOp
static bool isDereferencingOp(Operation *op)
Definition: Utils.cpp:1104

getTileSizePos
static LogicalResult getTileSizePos(AffineMap map, SmallVectorImpl< std::tuple< AffineExpr, unsigned, unsigned >> &tileSizePos)
Check if map is a tiled layout.
Definition: Utils.cpp:1495

TileExprPattern
TileExprPattern
Enum to set patterns of affine expr in tiled-layout map.
Definition: Utils.cpp:1487

TileFloorDiv
@ TileFloorDiv
Definition: Utils.cpp:1487

TileNone
@ TileNone
Definition: Utils.cpp:1487

TileMod
@ TileMod
Definition: Utils.cpp:1487

promoteIfBlock
static void promoteIfBlock(AffineIfOp ifOp, bool elseBlock)
Promotes the then or the else block of ifOp (depending on whether elseBlock is false or true) into if...
Definition: Utils.cpp:246

isNormalizedMemRefDynamicDim
static bool isNormalizedMemRefDynamicDim(unsigned dim, AffineMap layoutMap, SmallVectorImpl< unsigned > &inMemrefTypeDynDims)
Check if dim dimension of memrefType with layoutMap becomes dynamic after normalization.
Definition: Utils.cpp:1594

composedAffineMultiply
static FailureOr< OpFoldResult > composedAffineMultiply(OpBuilder &b, Location loc, OpFoldResult lhs, OpFoldResult rhs)
Create an affine map that computes lhs * rhs, composing in any other affine maps.
Definition: Utils.cpp:1957

loadCSE
static void loadCSE(AffineReadOpInterface loadA, SmallVectorImpl< Operation * > &loadOpsToErase, DominanceInfo &domInfo, llvm::function_ref< bool(Value, Value)> mayAlias)
Definition: Utils.cpp:959

createDimSizeExprForTiledLayout
static AffineExpr createDimSizeExprForTiledLayout(AffineExpr oldMapOutput, TileExprPattern pat)
Create affine expr to calculate dimension size for a tiled-layout map.
Definition: Utils.cpp:1613

getOutermostInvariantForOp
static Operation * getOutermostInvariantForOp(AffineIfOp ifOp)
Returns the outermost affine.for/parallel op that the ifOp is invariant on.
Definition: Utils.cpp:262

findUnusedStore
static void findUnusedStore(AffineWriteOpInterface writeA, SmallVectorImpl< Operation * > &opsToErase, PostDominanceInfo &postDominanceInfo, llvm::function_ref< bool(Value, Value)> mayAlias)
Definition: Utils.cpp:912

mustReachAtInnermost
static bool mustReachAtInnermost(const MemRefAccess &srcAccess, const MemRefAccess &destAccess)
Returns true if the memory operation of destAccess depends on srcAccess inside of the innermost commo...
Definition: Utils.cpp:636

forwardStoreToLoad
static void forwardStoreToLoad(AffineReadOpInterface loadOp, SmallVectorImpl< Operation * > &loadOpsToErase, SmallPtrSetImpl< Value > &memrefsToErase, DominanceInfo &domInfo, llvm::function_ref< bool(Value, Value)> mayAlias)
Attempt to eliminate loadOp by replacing it with a value stored into memory which the load is guarant...
Definition: Utils.cpp:835

Utils.h

Utils.h

visit
static void visit(Operation *op, DenseSet< Operation * > &visited)
Visits all the pdl.operand(s), pdl.result(s), and pdl.operation(s) connected to the given operation.
Definition: PDL.cpp:62

Dominance.h

mayAlias
static bool mayAlias(Value first, Value second)
Returns true if two values may be referencing aliasing memory.
Definition: EliminateBarriers.cpp:424

FuncOps.h

GreedyPatternRewriteDriver.h

IRMapping.h

IndexingUtils.h

LoopUtils.h

max
static Value max(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:212

min
static Value min(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:204

llvm::ArrayRef
Definition: LLVM.h:48

llvm::DenseSet
Definition: LLVM.h:59

llvm::SmallPtrSetImpl
Definition: LLVM.h:70

llvm::SmallPtrSet
Definition: LLVM.h:68

llvm::SmallVectorImpl
Definition: LLVM.h:74

llvm::SmallVector
Definition: LLVM.h:72

llvm::function_ref
Definition: LLVM.h:90

mlir::AffineBinaryOpExpr
Affine binary operation expression.
Definition: AffineExpr.h:214

mlir::AffineBinaryOpExpr::getLHS
AffineExpr getLHS() const
Definition: AffineExpr.cpp:338

mlir::AffineBinaryOpExpr::getRHS
AffineExpr getRHS() const
Definition: AffineExpr.cpp:341

mlir::AffineConstantExpr
An integer constant appearing in affine expression.
Definition: AffineExpr.h:239

mlir::AffineConstantExpr::getValue
int64_t getValue() const
Definition: AffineExpr.cpp:635

mlir::AffineDimExpr
A dimensional identifier appearing in an affine expression.
Definition: AffineExpr.h:223

mlir::AffineDimExpr::getPosition
unsigned getPosition() const
Definition: AffineExpr.cpp:346

mlir::AffineExprVisitor
See documentation for AffineExprVisitorBase.
Definition: AffineExprVisitor.h:144

mlir::AffineExpr
Base type for affine expression.
Definition: AffineExpr.h:68

mlir::AffineExpr::floorDiv
AffineExpr floorDiv(uint64_t v) const
Definition: AffineExpr.cpp:959

mlir::AffineExpr::walk
RetT walk(FnT &&callback) const
Walk all of the AffineExpr's in this expression in postorder.
Definition: AffineExpr.h:117

mlir::AffineExpr::ceilDiv
AffineExpr ceilDiv(uint64_t v) const
Definition: AffineExpr.cpp:1006

mlir::AffineMap
A multi-dimensional affine map Affine map's are immutable like Type's, and they are uniqued.
Definition: AffineMap.h:46

mlir::AffineMap::getContext
MLIRContext * getContext() const
Definition: AffineMap.cpp:339

mlir::AffineMap::getMultiDimIdentityMap
static AffineMap getMultiDimIdentityMap(unsigned numDims, MLIRContext *context)
Returns an AffineMap with 'numDims' identity result dim exprs.
Definition: AffineMap.cpp:330

mlir::AffineMap::get
static AffineMap get(MLIRContext *context)
Returns a zero result affine map with no dimensions or symbols: () -> ().
Definition: MLIRContext.cpp:1224

mlir::AffineMap::getNumSymbols
unsigned getNumSymbols() const
Definition: AffineMap.cpp:394

mlir::AffineMap::getNumDims
unsigned getNumDims() const
Definition: AffineMap.cpp:390

mlir::AffineMap::getResults
ArrayRef< AffineExpr > getResults() const
Definition: AffineMap.cpp:403

mlir::AffineMap::getNumResults
unsigned getNumResults() const
Definition: AffineMap.cpp:398

mlir::AffineMap::getNumInputs
unsigned getNumInputs() const
Definition: AffineMap.cpp:399

mlir::AffineMap::getResult
AffineExpr getResult(unsigned idx) const
Definition: AffineMap.cpp:407

mlir::AffineMap::compose
AffineMap compose(AffineMap map) const
Returns the AffineMap resulting from composing this with map.
Definition: AffineMap.cpp:552

mlir::AffineMap::isIdentity
bool isIdentity() const
Returns true if this affine map is an identity affine map.
Definition: AffineMap.cpp:341

mlir::AffineSymbolExpr
A symbolic identifier appearing in an affine expression.
Definition: AffineExpr.h:231

mlir::AffineSymbolExpr::getPosition
unsigned getPosition() const
Definition: AffineExpr.cpp:625

mlir::AliasAnalysis
This class represents the main alias analysis interface in MLIR.
Definition: AliasAnalysis.h:232

mlir::AliasAnalysis::alias
AliasResult alias(Value lhs, Value rhs)
Given two values, return their aliasing behavior.
Definition: AliasAnalysis.cpp:80

mlir::AliasResult::isNo
bool isNo() const
Returns if this result indicates no possibility of aliasing.
Definition: AliasAnalysis.h:59

mlir::BlockArgument
This class represents an argument of a Block.
Definition: Value.h:309

mlir::Block
Block represents an ordered list of Operations.
Definition: Block.h:33

mlir::Block::iterator
OpListType::iterator iterator
Definition: Block.h:140

mlir::Block::getSuccessors
SuccessorRange getSuccessors()
Definition: Block.h:270

mlir::Block::getTerminator
Operation * getTerminator()
Get the terminator operation of this block.
Definition: Block.cpp:244

mlir::Block::getOperations
OpListType & getOperations()
Definition: Block.h:137

mlir::Block::end
iterator end()
Definition: Block.h:144

mlir::Block::begin
iterator begin()
Definition: Block.h:143

mlir::Builder::getIndexAttr
IntegerAttr getIndexAttr(int64_t value)
Definition: Builders.cpp:108

mlir::Builder::getIntegerAttr
IntegerAttr getIntegerAttr(Type type, int64_t value)
Definition: Builders.cpp:228

mlir::Builder::getMultiDimIdentityMap
AffineMap getMultiDimIdentityMap(unsigned rank)
Definition: Builders.cpp:387

mlir::Builder::getBoolAttr
BoolAttr getBoolAttr(bool value)
Definition: Builders.cpp:100

mlir::Builder::getStringAttr
StringAttr getStringAttr(const Twine &bytes)
Definition: Builders.cpp:262

mlir::Builder::getAffineDimExpr
AffineExpr getAffineDimExpr(unsigned position)
Definition: Builders.cpp:364

mlir::Builder::getConstantAffineMap
AffineMap getConstantAffineMap(int64_t val)
Returns a single constant result affine map with 0 dimensions and 0 symbols.
Definition: Builders.cpp:378

mlir::Builder::getContext
MLIRContext * getContext() const
Definition: Builders.h:56

mlir::Builder::getIndexType
IndexType getIndexType()
Definition: Builders.cpp:51

mlir::DominanceInfo
A class for computing basic dominance information.
Definition: Dominance.h:140

mlir::DominanceInfo::dominates
bool dominates(Operation *a, Operation *b) const
Return true if operation A dominates operation B, i.e.
Definition: Dominance.h:158

mlir::FlatLinearConstraints::composeMatchingMap
LogicalResult composeMatchingMap(AffineMap other)
Composes an affine map whose dimensions and symbols match one to one with the dimensions and symbols ...
Definition: FlatLinearValueConstraints.cpp:226

mlir::FlatLinearValueConstraints::projectOut
void projectOut(Value val)
Projects out the variable that is associate with Value.
Definition: FlatLinearValueConstraints.cpp:1482

mlir::FrozenRewritePatternSet
This class represents a frozen set of patterns that can be processed by a pattern applicator.
Definition: FrozenRewritePatternSet.h:24

mlir::GreedyRewriteConfig
This class allows control over how the GreedyPatternRewriteDriver works.
Definition: GreedyPatternRewriteDriver.h:43

mlir::GreedyRewriteConfig::setStrictness
GreedyRewriteConfig & setStrictness(GreedyRewriteStrictness mode)
Definition: GreedyPatternRewriteDriver.h:113

mlir::IRMapping
This is a utility class for mapping one set of IR entities to another.
Definition: IRMapping.h:26

mlir::IRMapping::clear
void clear()
Clears all mappings held by the mapper.
Definition: IRMapping.h:79

mlir::ImplicitLocOpBuilder
ImplicitLocOpBuilder maintains a 'current location', allowing use of the create<> method without spec...
Definition: Builders.h:629

mlir::ImplicitLocOpBuilder::getLoc
Location getLoc() const
Accessors for the implied location.
Definition: Builders.h:662

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:76

mlir::MLIRContext
MLIRContext is the top-level object for a collection of MLIR operations.
Definition: MLIRContext.h:63

mlir::MemRefType::Builder
This is a builder type that keeps local references to arguments.
Definition: BuiltinTypes.h:182

mlir::MemRefType::Builder::setLayout
Builder & setLayout(MemRefLayoutAttrInterface newLayout)
Definition: BuiltinTypes.h:203

mlir::MemRefType::Builder::setShape
Builder & setShape(ArrayRef< int64_t > newShape)
Definition: BuiltinTypes.h:193

mlir::NamedAttribute
NamedAttribute represents a combination of a name and an Attribute value.
Definition: Attributes.h:164

mlir::NamedAttribute::getValue
Attribute getValue() const
Return the value of the attribute.
Definition: Attributes.h:179

mlir::OpBuilder
This class helps build Operations.
Definition: Builders.h:207

mlir::OpBuilder::atBlockBegin
static OpBuilder atBlockBegin(Block *block, Listener *listener=nullptr)
Create a builder and set the insertion point to before the first operation in the block but still ins...
Definition: Builders.h:240

mlir::OpBuilder::getInsertionPoint
Block::iterator getInsertionPoint() const
Returns the current insertion point of the builder.
Definition: Builders.h:445

mlir::OpBuilder::clone
Operation * clone(Operation &op, IRMapping &mapper)
Creates a deep copy of the specified operation, remapping any operands that use values outside of the...
Definition: Builders.cpp:562

mlir::OpBuilder::setInsertionPointToStart
void setInsertionPointToStart(Block *block)
Sets the insertion point to the start of the specified block.
Definition: Builders.h:431

mlir::OpBuilder::create
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
Definition: Builders.cpp:457

mlir::OpBuilder::setInsertionPointAfter
void setInsertionPointAfter(Operation *op)
Sets the insertion point to the node after the specified operation, which will cause subsequent inser...
Definition: Builders.h:412

mlir::OpBuilder::getInsertionBlock
Block * getInsertionBlock() const
Return the block the current insertion point belongs to.
Definition: Builders.h:442

mlir::OpFoldResult
This class represents a single result from folding an operation.
Definition: OpDefinition.h:272

mlir::OpTrait::HasRecursiveMemoryEffects
This trait indicates that the memory effects of an operation includes the effects of operations neste...
Definition: SideEffectInterfaces.h:317

mlir::OpTrait::IsIsolatedFromAbove
This class provides the API for ops that are known to be isolated from above.
Definition: OpDefinition.h:1261

mlir::OperandRange
This class implements the operand iterators for the Operation class.
Definition: ValueRange.h:43

mlir::Operation
Operation is the basic unit of execution within MLIR.
Definition: Operation.h:88

mlir::Operation::getOperand
Value getOperand(unsigned idx)
Definition: Operation.h:350

mlir::Operation::hasTrait
bool hasTrait()
Returns true if the operation was registered with a particular trait, e.g.
Definition: Operation.h:749

mlir::Operation::setOperand
void setOperand(unsigned idx, Value value)
Definition: Operation.h:351

mlir::Operation::operand_begin
operand_iterator operand_begin()
Definition: Operation.h:374

mlir::Operation::getResult
OpResult getResult(unsigned idx)
Get the 'idx'th result of this operation.
Definition: Operation.h:407

mlir::Operation::walk
std::enable_if_t< llvm::function_traits< std::decay_t< FnT > >::num_args==1, RetT > walk(FnT &&callback)
Walk the operation by calling the callback for each nested operation (including this one),...
Definition: Operation.h:797

mlir::Operation::getLoc
Location getLoc()
The source location the operation was defined or derived from.
Definition: Operation.h:223

mlir::Operation::getNumOperands
unsigned getNumOperands()
Definition: Operation.h:346

mlir::Operation::getParentOp
Operation * getParentOp()
Returns the closest surrounding operation that contains this operation or nullptr if this is a top-le...
Definition: Operation.h:234

mlir::Operation::getAttrs
ArrayRef< NamedAttribute > getAttrs()
Return all of the attributes on this operation.
Definition: Operation.h:512

mlir::Operation::getBlock
Block * getBlock()
Returns the operation block that contains this operation.
Definition: Operation.h:213

mlir::Operation::operand_end
operand_iterator operand_end()
Definition: Operation.h:375

mlir::Operation::getName
OperationName getName()
The name of an operation is the key identifier for it.
Definition: Operation.h:119

mlir::Operation::getOperands
operand_range getOperands()
Returns an iterator on the underlying Value's.
Definition: Operation.h:378

mlir::Operation::isAncestor
bool isAncestor(Operation *other)
Return true if this operation is an ancestor of the other operation.
Definition: Operation.h:263

mlir::Operation::replaceAllUsesWith
void replaceAllUsesWith(ValuesT &&values)
Replace all uses of results of this operation with the provided 'values'.
Definition: Operation.h:272

mlir::Operation::setOperands
void setOperands(ValueRange operands)
Replace the current operands of this operation with the ones provided in 'operands'.
Definition: Operation.cpp:237

mlir::Operation::getUsers
user_range getUsers()
Returns a range of all users.
Definition: Operation.h:873

mlir::Operation::getParentRegion
Region * getParentRegion()
Returns the region to which the instruction belongs.
Definition: Operation.h:230

mlir::Operation::getResults
result_range getResults()
Definition: Operation.h:415

mlir::Operation::erase
void erase()
Remove this operation from its parent block and delete it.
Definition: Operation.cpp:539

mlir::Operation::getNumResults
unsigned getNumResults()
Return the number of results held by this operation.
Definition: Operation.h:404

mlir::PostDominanceInfo
A class for computing basic postdominance information.
Definition: Dominance.h:204

mlir::PostDominanceInfo::postDominates
bool postDominates(Operation *a, Operation *b) const
Return true if operation A postdominates operation B.
Definition: Dominance.h:213

mlir::Region
This class contains a list of basic blocks and a link to the parent operation it is attached to.
Definition: Region.h:26

mlir::Region::getParentRegion
Region * getParentRegion()
Return the region containing this region or nullptr if the region is attached to a top-level operatio...
Definition: Region.cpp:45

mlir::Region::isAncestor
bool isAncestor(Region *other)
Return true if this region is ancestor of the other region.
Definition: Region.h:222

mlir::RewritePatternSet
Definition: PatternMatch.h:816

mlir::ValueRange
This class provides an abstraction over the different types of ranges over Values.
Definition: ValueRange.h:387

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:105

mlir::Value::replaceAllUsesExcept
void replaceAllUsesExcept(Value newValue, const SmallPtrSetImpl< Operation * > &exceptions)
Replace all uses of 'this' value with 'newValue', updating anything in the IR that uses 'this' to use...
Definition: Value.cpp:71

mlir::Value::replaceAllUsesWith
void replaceAllUsesWith(Value newValue)
Replace all uses of 'this' value with the new value, updating anything in the IR that uses 'this' to ...
Definition: Value.h:149

mlir::Value::getUsers
user_range getUsers() const
Definition: Value.h:218

mlir::Value::getDefiningOp
Operation * getDefiningOp() const
If this value is the result of an operation, return the operation that defines it.
Definition: Value.cpp:18

mlir::WalkResult::advance
static WalkResult advance()
Definition: WalkResult.h:47

mlir::WalkResult::interrupt
static WalkResult interrupt()
Definition: WalkResult.h:46

mlir::affine::AffineValueMap
An AffineValueMap is an affine map plus its ML value operands and results for analysis purposes.
Definition: AffineValueMap.h:35

mlir::affine::AffineValueMap::canonicalize
LogicalResult canonicalize()
Attempts to canonicalize the map and operands.
Definition: AffineOps.cpp:4329

mlir::affine::AffineValueMap::getNumSymbols
unsigned getNumSymbols() const
Definition: AffineValueMap.h:76

mlir::affine::AffineValueMap::getOperands
ArrayRef< Value > getOperands() const
Definition: AffineValueMap.cpp:106

mlir::affine::AffineValueMap::getNumDims
unsigned getNumDims() const
Definition: AffineValueMap.h:75

mlir::affine::AffineValueMap::getResult
AffineExpr getResult(unsigned i)
Definition: AffineValueMap.h:73

mlir::affine::AffineValueMap::getAffineMap
AffineMap getAffineMap() const
Definition: AffineValueMap.cpp:110

mlir::affine::AffineValueMap::getNumResults
unsigned getNumResults() const
Definition: AffineValueMap.h:77

mlir::affine::AffineValueMap::difference
static void difference(const AffineValueMap &a, const AffineValueMap &b, AffineValueMap *res)
Return the value map that is the difference of value maps 'a' and 'b', represented as an affine map a...
Definition: AffineValueMap.cpp:36

mlir::affine::FlatAffineValueConstraints
FlatAffineValueConstraints is an extension of FlatLinearValueConstraints with helper functions for Af...
Definition: AffineStructures.h:44

mlir::affine::FlatAffineValueConstraints::addBound
LogicalResult addBound(presburger::BoundType type, unsigned pos, AffineMap boundMap, ValueRange operands)
Adds a bound for the variable at the specified position with constraints being drawn from the specifi...
Definition: AffineStructures.cpp:220

mlir::arith::ConstantIndexOp::create
static ConstantIndexOp create(OpBuilder &builder, Location location, int64_t value)
Definition: ArithOps.cpp:359

mlir::presburger::IntegerRelation::getConstantBound64
std::optional< int64_t > getConstantBound64(BoundType type, unsigned pos) const
The same, but casts to int64_t.
Definition: IntegerRelation.h:591

mlir::presburger::IntegerRelation::getNumVars
unsigned getNumVars() const
Definition: IntegerRelation.h:221

mlir::presburger::IntegerRelation::getNumLocalVars
unsigned getNumLocalVars() const
Definition: IntegerRelation.h:215

MemRef.h

IntegerSet.h

mlir::affine::expandAffineMap
std::optional< SmallVector< Value, 8 > > expandAffineMap(OpBuilder &builder, Location loc, AffineMap affineMap, ValueRange operands)
Create a sequence of operations that implement the affineMap applied to the given operands (as it it ...
Definition: Utils.cpp:228

mlir::affine::makeComposedAffineApply
AffineApplyOp makeComposedAffineApply(OpBuilder &b, Location loc, AffineMap map, ArrayRef< OpFoldResult > operands, bool composeAffineMin=false)
Returns a composed AffineApplyOp by composing map and operands with other AffineApplyOps supplying th...
Definition: AffineOps.cpp:1416

mlir::affine::affineScalarReplace
void affineScalarReplace(func::FuncOp f, DominanceInfo &domInfo, PostDominanceInfo &postDomInfo, AliasAnalysis &analysis)
Replace affine store and load accesses by scalars by forwarding stores to loads and eliminate invaria...
Definition: Utils.cpp:1040

mlir::affine::promoteIfSingleIteration
LogicalResult promoteIfSingleIteration(AffineForOp forOp)
Promotes the loop body of a AffineForOp to its containing block if the loop was known to have a singl...
Definition: LoopUtils.cpp:119

mlir::affine::isValidDim
bool isValidDim(Value value)
Returns true if the given Value can be used as a dimension id in the region of the closest surroundin...
Definition: AffineOps.cpp:290

mlir::affine::expandAffineExpr
Value expandAffineExpr(OpBuilder &builder, Location loc, AffineExpr expr, ValueRange dimValues, ValueRange symbolValues)
Emit code that computes the given affine expression using standard arithmetic operations applied to t...
Definition: Utils.cpp:218

mlir::affine::getNumCommonSurroundingLoops
unsigned getNumCommonSurroundingLoops(Operation &a, Operation &b)
Returns the number of surrounding loops common to both A and B.
Definition: Utils.cpp:2108

mlir::affine::normalizeAffineParallel
void normalizeAffineParallel(AffineParallelOp op)
Normalize a affine.parallel op so that lower bounds are 0 and steps are 1.
Definition: Utils.cpp:494

mlir::affine::checkMemrefAccessDependence
DependenceResult checkMemrefAccessDependence(const MemRefAccess &srcAccess, const MemRefAccess &dstAccess, unsigned loopDepth, FlatAffineValueConstraints *dependenceConstraints=nullptr, SmallVector< DependenceComponent, 2 > *dependenceComponents=nullptr, bool allowRAR=false)
Definition: AffineAnalysis.cpp:608

mlir::affine::affineParallelize
LogicalResult affineParallelize(AffineForOp forOp, ArrayRef< LoopReduction > parallelReductions={}, AffineParallelOp *resOp=nullptr)
Replaces a parallel affine.for op with a 1-d affine.parallel op.
Definition: Utils.cpp:352

mlir::affine::canonicalizeMapAndOperands
void canonicalizeMapAndOperands(AffineMap *map, SmallVectorImpl< Value > *operands)
Modifies both map and operands in-place so as to:
Definition: AffineOps.cpp:1759

mlir::affine::getReachableAffineApplyOps
void getReachableAffineApplyOps(ArrayRef< Value > operands, SmallVectorImpl< Operation * > &affineApplyOps)
Returns in affineApplyOps, the sequence of those AffineApplyOp Operations that are reachable via a se...
Definition: AffineAnalysis.cpp:189

mlir::affine::makeComposedFoldedAffineApply
OpFoldResult makeComposedFoldedAffineApply(OpBuilder &b, Location loc, AffineMap map, ArrayRef< OpFoldResult > operands, bool composeAffineMin=false)
Constructs an AffineApplyOp that applies map to operands after composing the map with the maps of any...
Definition: AffineOps.cpp:1469

mlir::affine::normalizeAffineFor
LogicalResult normalizeAffineFor(AffineForOp op, bool promoteSingleIter=false)
Normalize an affine.for op.
Definition: Utils.cpp:559

mlir::affine::getAffineAnalysisScope
Region * getAffineAnalysisScope(Operation *op)
Returns the closest region enclosing op that is held by a non-affine operation; nullptr if there is n...
Definition: AffineOps.cpp:275

mlir::affine::fullyComposeAffineMapAndOperands
void fullyComposeAffineMapAndOperands(AffineMap *map, SmallVectorImpl< Value > *operands, bool composeAffineMin=false)
Given an affine map map and its input operands, this method composes into map, maps of AffineApplyOps...
Definition: AffineOps.cpp:1400

mlir::affine::isValidSymbol
bool isValidSymbol(Value value)
Returns true if the given value can be used as a symbol in the region of the closest surrounding op t...
Definition: AffineOps.cpp:412

mlir::affine::hasDependence
bool hasDependence(DependenceResult result)
Utility function that returns true if the provided DependenceResult corresponds to a dependence resul...
Definition: AffineAnalysis.h:181

mlir::affine::normalizeMemRefType
MemRefType normalizeMemRefType(MemRefType memrefType)
Normalizes memrefType so that the affine layout map of the memref is transformed to an identity map w...
Definition: Utils.cpp:1864

mlir::affine::normalizeMemRef
LogicalResult normalizeMemRef(AllocLikeOp op)
Rewrites the memref defined by alloc or reinterpret_cast op to have an identity layout map and update...
Definition: Utils.cpp:1718

mlir::affine::delinearizeIndex
FailureOr< SmallVector< Value > > delinearizeIndex(OpBuilder &b, Location loc, Value linearIndex, ArrayRef< Value > basis, bool hasOuterBound=true)
Generate the IR to delinearize linearIndex given the basis and return the multi-index.
Definition: Utils.cpp:1967

mlir::affine::linearizeIndex
OpFoldResult linearizeIndex(ArrayRef< OpFoldResult > multiIndex, ArrayRef< OpFoldResult > basis, ImplicitLocOpBuilder &builder)
Definition: Utils.cpp:2027

mlir::affine::getDivMod
DivModValue getDivMod(OpBuilder &b, Location loc, Value lhs, Value rhs)
Create IR to calculate (div lhs, rhs) and (mod lhs, rhs).
Definition: Utils.cpp:1943

mlir::affine::hasNoInterveningEffect
bool hasNoInterveningEffect(Operation *start, T memOp, llvm::function_ref< bool(Value, Value)> mayAlias)
Ensure that all operations that could be executed after start (noninclusive) and prior to memOp (e....
Definition: Utils.cpp:687

mlir::affine::createAffineComputationSlice
void createAffineComputationSlice(Operation *opInst, SmallVectorImpl< AffineApplyOp > *sliceOps)
Given an operation, inserts one or more single result affine apply operations, results of which are e...
Definition: Utils.cpp:1413

mlir::affine::hoistAffineIfOp
LogicalResult hoistAffineIfOp(AffineIfOp ifOp, bool *folded=nullptr)
Hoists out affine.if/else to as high as possible, i.e., past all invariant affine....
Definition: Utils.cpp:414

mlir::affine::noDependence
bool noDependence(DependenceResult result)
Returns true if the provided DependenceResult corresponds to the absence of a dependence.
Definition: AffineAnalysis.h:187

mlir::affine::replaceAllMemRefUsesWith
LogicalResult replaceAllMemRefUsesWith(Value oldMemRef, Value newMemRef, ArrayRef< Value > extraIndices={}, AffineMap indexRemap=AffineMap(), ArrayRef< Value > extraOperands={}, ArrayRef< Value > symbolOperands={}, llvm::function_ref< bool(Operation *)> userFilterFn=nullptr, bool allowNonDereferencingOps=false, bool replaceInDeallocOp=false)
Replaces all "dereferencing" uses of oldMemRef with newMemRef while optionally remapping the old memr...
Definition: Utils.cpp:1306

mlir::affine::substWithMin
AffineExpr substWithMin(AffineExpr e, AffineExpr dim, AffineExpr min, AffineExpr max, bool positivePath=true)
Traverse e and return an AffineExpr where all occurrences of dim have been replaced by either:
Definition: Utils.cpp:467

mlir::detail::enumerate
constexpr void enumerate(std::tuple< Tys... > &tuple, CallbackT &&callback)
Definition: Matchers.h:344

mlir::remark::failed
detail::InFlightRemark failed(Location loc, RemarkOpts opts)
Report an optimization remark that failed.
Definition: Remarks.h:561

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::simplifyAffineMap
AffineMap simplifyAffineMap(AffineMap map)
Simplifies an affine map by simplifying its underlying AffineExpr results.
Definition: AffineMap.cpp:766

mlir::getType
Type getType(OpFoldResult ofr)
Returns the int type of the integer in ofr.
Definition: Utils.cpp:304

mlir::bindDims
void bindDims(MLIRContext *ctx, AffineExprTy &...exprs)
Bind a list of AffineExpr references to DimExpr at positions: [0 .
Definition: AffineExpr.h:311

mlir::computeLinearIndex
std::pair< AffineExpr, SmallVector< OpFoldResult > > computeLinearIndex(OpFoldResult sourceOffset, ArrayRef< OpFoldResult > strides, ArrayRef< OpFoldResult > indices)
Compute linear index from provided strides and indices, assuming strided layout.
Definition: IndexingUtils.cpp:286

mlir::applyPatternsGreedily
LogicalResult applyPatternsGreedily(Region &region, const FrozenRewritePatternSet &patterns, GreedyRewriteConfig config=GreedyRewriteConfig(), bool *changed=nullptr)
Rewrite ops in the given region, which must be isolated from above, by repeatedly applying the highes...
Definition: GreedyPatternRewriteDriver.cpp:913

mlir::computeStrides
SmallVector< int64_t > computeStrides(ArrayRef< int64_t > sizes)
Definition: IndexingUtils.h:47

mlir::emitError
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
Definition: Diagnostics.cpp:328

mlir::applyOpPatternsGreedily
LogicalResult applyOpPatternsGreedily(ArrayRef< Operation * > ops, const FrozenRewritePatternSet &patterns, GreedyRewriteConfig config=GreedyRewriteConfig(), bool *changed=nullptr, bool *allErased=nullptr)
Rewrite the specified ops by repeatedly applying the highest benefit patterns in a greedy worklist dr...
Definition: GreedyPatternRewriteDriver.cpp:1030

mlir::AffineExprKind::CeilDiv
@ CeilDiv
RHS of ceildiv is always a constant or a symbolic expression.

mlir::AffineExprKind::Mod
@ Mod
RHS of mod is always a constant or a symbolic expression with a positive value.

mlir::AffineExprKind::FloorDiv
@ FloorDiv
RHS of floordiv is always a constant or a symbolic expression.

mlir::AffineExprKind::Add
@ Add

mlir::getAffineBinaryOpExpr
AffineExpr getAffineBinaryOpExpr(AffineExprKind kind, AffineExpr lhs, AffineExpr rhs)
Definition: AffineExpr.cpp:68

mlir::patterns
const FrozenRewritePatternSet & patterns
Definition: GreedyPatternRewriteDriver.h:283

mlir::bindSymbols
void bindSymbols(MLIRContext *ctx, AffineExprTy &...exprs)
Bind a list of AffineExpr references to SymbolExpr at positions: [0 .
Definition: AffineExpr.h:325

mlir::getValueOrCreateConstantIndexOp
Value getValueOrCreateConstantIndexOp(OpBuilder &b, Location loc, OpFoldResult ofr)
Converts an OpFoldResult to a Value.
Definition: Utils.cpp:111

mlir::getAffineConstantExpr
AffineExpr getAffineConstantExpr(int64_t constant, MLIRContext *context)
Definition: AffineExpr.cpp:643

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:509

mlir::GreedyRewriteStrictness::ExistingOps
@ ExistingOps
Only pre-existing ops are processed.

mlir::getAffineDimExpr
AffineExpr getAffineDimExpr(unsigned position, MLIRContext *context)
These free functions allow clients of the API to not use classes in detail.
Definition: AffineExpr.cpp:619

mlir::getAffineSymbolExpr
AffineExpr getAffineSymbolExpr(unsigned position, MLIRContext *context)
Definition: AffineExpr.cpp:629

mlir::MemoryEffects::Read
The following effect indicates that the operation reads from some resource.
Definition: SideEffectInterfaces.h:374

mlir::OpTrait::MemRefsNormalizable
Definition: OpDefinition.h:1377

mlir::OperationState
This represents an operation in an abstracted form, suitable for use with the builder APIs.
Definition: OperationSupport.h:948

mlir::affine::DependenceResult
Checks whether two accesses to the same memref access the same element.
Definition: AffineAnalysis.h:163

mlir::affine::DivModValue
Holds the result of (div a, b) and (mod a, b).
Definition: Utils.h:309

mlir::affine::DivModValue::remainder
Value remainder
Definition: Utils.h:311

mlir::affine::DivModValue::quotient
Value quotient
Definition: Utils.h:310

mlir::affine::LoopReduction
A description of a (parallelizable) reduction in an affine loop.
Definition: AffineAnalysis.h:35

mlir::affine::LoopReduction::kind
arith::AtomicRMWKind kind
Reduction kind.
Definition: AffineAnalysis.h:37

mlir::affine::LoopReduction::value
Value value
The value being reduced.
Definition: AffineAnalysis.h:43

mlir::affine::MemRefAccess
Encapsulates a memref load or store access information.
Definition: AffineAnalysis.h:82

mlir::affine::MemRefAccess::opInst
Operation * opInst
Definition: AffineAnalysis.h:84

mlir::affine::MemRefAccess::memref
Value memref
Definition: AffineAnalysis.h:83

j
Eliminates variable at the specified position using Fourier-Motzkin variable elimination.