doxygen/TosaToArith_8cpp_source.html

 //===- TosaToArith.cpp - Lowering Tosa to Arith Dialect -------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // These rewriters lower from the Tosa to the Arith dialect.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Conversion/TosaToArith/TosaToArith.h"

 #include "mlir/Dialect/Arith/IR/Arith.h"

 #include "mlir/Dialect/Tosa/IR/TosaOps.h"

 #include "mlir/IR/PatternMatch.h"

 #include "mlir/IR/TypeUtilities.h"

 #include "mlir/Transforms/GreedyPatternRewriteDriver.h"


 using namespace mlir;

 using namespace tosa;


 namespace {


 class ConstOpConverter : public OpRewritePattern<tosa::ConstOp> {

 public:

   using OpRewritePattern<tosa::ConstOp>::OpRewritePattern;


   LogicalResult matchAndRewrite(tosa::ConstOp op,

                                 PatternRewriter &rewriter) const final {

     rewriter.replaceOpWithNewOp<arith::ConstantOp>(op, op.getValues());

     return success();

   }

 };


 Type matchContainerType(Type element, Type container) {

   if (auto shapedTy = dyn_cast<ShapedType>(container))

     return shapedTy.clone(element);


   return element;

 }


 TypedAttr getConstantAttr(Type type, int64_t value, PatternRewriter &rewriter) {

   if (auto shapedTy = dyn_cast<ShapedType>(type)) {

     Type eTy = shapedTy.getElementType();

     APInt valueInt(eTy.getIntOrFloatBitWidth(), value, /*isSigned=*/true);

     return DenseIntElementsAttr::get(shapedTy, valueInt);

   }


   return rewriter.getIntegerAttr(type, value);

 }


 Value getConstantValue(Location loc, Type type, int64_t value,

                        PatternRewriter &rewriter) {

   return rewriter.create<arith::ConstantOp>(

       loc, getConstantAttr(type, value, rewriter));

 }


 // This converts the TOSA ApplyScale operator to a set of arithmetic ops,

 // using 64-bit operations to perform the necessary multiply, bias, and shift.

 class ApplyScaleGenericOpConverter

     : public OpRewritePattern<tosa::ApplyScaleOp> {

 public:

   using OpRewritePattern<tosa::ApplyScaleOp>::OpRewritePattern;


   LogicalResult matchAndRewrite(tosa::ApplyScaleOp op,

                                 PatternRewriter &rewriter) const final {

     StringRef roundingMode = op.getRoundingMode();

     if (roundingMode != "DOUBLE_ROUND" && roundingMode != "SINGLE_ROUND") {

       return failure();

     }


     Location loc = op.getLoc();

     Value value = op.getValue();

     Value multiplier32 = op.getMultiplier();


     Type resultTy = op.getType();

     Type valueTy = value.getType();

     Type i32Ty = matchContainerType(rewriter.getI32Type(), resultTy);

     Type i64Ty = matchContainerType(rewriter.getI64Type(), resultTy);


     Value zero = getConstantValue(loc, valueTy, 0, rewriter);

     Value one64 = getConstantValue(loc, i64Ty, 1, rewriter);

     Value thirtyOne32 = getConstantValue(loc, i32Ty, 31, rewriter);


     Value shift32 = rewriter.create<arith::ExtUIOp>(loc, i32Ty, op.getShift());


     // Compute the multiplication in 64-bits then select the high / low parts.

     Value value64 = value;

     if (getElementTypeOrSelf(valueTy) != rewriter.getI64Type())

       value64 = rewriter.create<arith::ExtSIOp>(loc, i64Ty, value);

     Value multiplier64 =

         rewriter.create<arith::ExtSIOp>(loc, i64Ty, multiplier32);

     Value multiply64 =

         rewriter.create<arith::MulIOp>(loc, value64, multiplier64);


     // Apply normal rounding.

     Value shift64 = rewriter.create<arith::ExtUIOp>(loc, i64Ty, shift32);

     Value round = rewriter.create<arith::ShLIOp>(loc, one64, shift64);

     round = rewriter.create<arith::ShRUIOp>(loc, round, one64);

     multiply64 = rewriter.create<arith::AddIOp>(loc, multiply64, round);


     // Apply double rounding if necessary.

     if (op.getRoundingMode() == "DOUBLE_ROUND") {

       int64_t roundInt = 1 << 30;

       Value roundUp = getConstantValue(loc, i64Ty, roundInt, rewriter);

       Value roundDown = getConstantValue(loc, i64Ty, -roundInt, rewriter);

       Value positive = rewriter.create<arith::CmpIOp>(

           loc, arith::CmpIPredicate::sge, value, zero);

       Value dir =

           rewriter.create<arith::SelectOp>(loc, positive, roundUp, roundDown);

       Value val = rewriter.create<arith::AddIOp>(loc, dir, multiply64);

       Value valid = rewriter.create<arith::CmpIOp>(

           loc, arith::CmpIPredicate::sgt, shift32, thirtyOne32);

       multiply64 =

           rewriter.create<arith::SelectOp>(loc, valid, val, multiply64);

     }


     Value result64 = rewriter.create<arith::ShRSIOp>(loc, multiply64, shift64);

     Value result32 = rewriter.create<arith::TruncIOp>(loc, i32Ty, result64);


     rewriter.replaceOp(op, result32);

     return success();

   }

 };


 class ApplyScale32BitOpConverter : public OpRewritePattern<tosa::ApplyScaleOp> {

 public:

   using OpRewritePattern<tosa::ApplyScaleOp>::OpRewritePattern;


   LogicalResult matchAndRewrite(tosa::ApplyScaleOp op,

                                 PatternRewriter &rewriter) const final {

     StringRef roundingMode = op.getRoundingMode();

     if (roundingMode != "DOUBLE_ROUND" && roundingMode != "SINGLE_ROUND") {

       return failure();

     }


     Location loc = op.getLoc();


     Type resultTy = op.getType();

     Type i32Ty = matchContainerType(rewriter.getI32Type(), resultTy);


     Value value = op.getValue();

     if (getElementTypeOrSelf(value.getType()).getIntOrFloatBitWidth() > 32) {

       return failure();

     }


     Value value32 = op.getValue();

     Value multiplier32 = op.getMultiplier();

     Value shift32 = rewriter.create<arith::ExtUIOp>(loc, i32Ty, op.getShift());


     // Constants used during the scaling operation.

     Value zero32 = getConstantValue(loc, i32Ty, 0, rewriter);

     Value one32 = getConstantValue(loc, i32Ty, 1, rewriter);

     Value two32 = getConstantValue(loc, i32Ty, 2, rewriter);

     Value thirty32 = getConstantValue(loc, i32Ty, 30, rewriter);

     Value thirtyTwo32 = getConstantValue(loc, i32Ty, 32, rewriter);


     // Compute the multiplication in 64-bits then select the high / low parts.

     // Grab out the high/low of the computation

     auto value64 =

         rewriter.create<arith::MulSIExtendedOp>(loc, value32, multiplier32);

     Value low32 = value64.getLow();

     Value high32 = value64.getHigh();


     // Determine the direction and amount to shift the high bits.

     Value shiftOver32 = rewriter.create<arith::CmpIOp>(

         loc, arith::CmpIPredicate::sge, shift32, thirtyTwo32);

     Value roundHighBits = rewriter.create<arith::CmpIOp>(

         loc, arith::CmpIPredicate::sgt, shift32, thirtyTwo32);


     Value shiftHighL =

         rewriter.create<arith::SubIOp>(loc, thirtyTwo32, shift32);

     Value shiftHighR =

         rewriter.create<arith::SubIOp>(loc, shift32, thirtyTwo32);


     shiftHighL =

         rewriter.create<arith::SelectOp>(loc, shiftOver32, zero32, shiftHighL);

     shiftHighR =

         rewriter.create<arith::SelectOp>(loc, shiftOver32, shiftHighR, zero32);


     // Conditionally perform our double round.

     if (op.getRoundingMode() == "DOUBLE_ROUND") {

       Value negOne32 = getConstantValue(loc, i32Ty, -1, rewriter);

       Value valuePositive = rewriter.create<arith::CmpIOp>(

           loc, arith::CmpIPredicate::sge, value32, zero32);


       Value roundDir =

           rewriter.create<arith::SelectOp>(loc, valuePositive, one32, negOne32);

       roundDir =

           rewriter.create<arith::SelectOp>(loc, shiftOver32, roundDir, zero32);


       Value shiftLow = rewriter.create<arith::ShRUIOp>(loc, low32, thirty32);

       Value rounded = rewriter.create<arith::AddIOp>(loc, shiftLow, roundDir);

       Value carry = rewriter.create<arith::ShRSIOp>(loc, rounded, two32);


       Value shiftRound =

           rewriter.create<arith::ShLIOp>(loc, roundDir, thirty32);


       low32 = rewriter.create<arith::AddIOp>(loc, low32, shiftRound);

       high32 = rewriter.create<arith::AddIOp>(loc, high32, carry);

     }


     // Conditionally apply rounding in the low bits.

     {

       Value shiftSubOne = rewriter.create<arith::SubIOp>(loc, shift32, one32);

       Value roundBit = rewriter.create<arith::ShLIOp>(loc, one32, shiftSubOne);

       roundBit = rewriter.create<arith::SelectOp>(loc, roundHighBits, zero32,

                                                   roundBit);


       Value newLow32 = rewriter.create<arith::AddIOp>(loc, low32, roundBit);

       Value wasRounded = rewriter.create<arith::CmpIOp>(

           loc, arith::CmpIPredicate::ugt, low32, newLow32);

       low32 = newLow32;


       Value rounded32 = rewriter.create<arith::ExtUIOp>(loc, i32Ty, wasRounded);

       high32 = rewriter.create<arith::AddIOp>(loc, high32, rounded32);

     }


     // Conditionally apply rounding in the high bits.

     {

       Value shiftSubOne =

           rewriter.create<arith::SubIOp>(loc, shiftHighR, one32);

       Value roundBit = rewriter.create<arith::ShLIOp>(loc, one32, shiftSubOne);

       roundBit = rewriter.create<arith::SelectOp>(loc, roundHighBits, roundBit,

                                                   zero32);

       high32 = rewriter.create<arith::AddIOp>(loc, high32, roundBit);

     }


     // Combine the correct high/low bits into the final rescale result.

     high32 = rewriter.create<arith::ShLIOp>(loc, high32, shiftHighL);

     high32 = rewriter.create<arith::ShRSIOp>(loc, high32, shiftHighR);

     low32 = rewriter.create<arith::ShRUIOp>(loc, low32, shift32);

     low32 = rewriter.create<arith::SelectOp>(loc, shiftOver32, zero32, low32);


     // Apply the rounding behavior and shift to the final alignment.

     Value result = rewriter.create<arith::AddIOp>(loc, low32, high32);


     // Truncate if necessary.

     if (!getElementTypeOrSelf(resultTy).isInteger(32)) {

       result = rewriter.create<arith::TruncIOp>(loc, resultTy, result);

     }


     rewriter.replaceOp(op, result);

     return success();

   }

 };


 } // namespace


 void mlir::tosa::populateTosaToArithConversionPatterns(

     RewritePatternSet *patterns) {

   patterns->add<ConstOpConverter>(patterns->getContext());

 }


 void mlir::tosa::populateTosaRescaleToArithConversionPatterns(

     RewritePatternSet *patterns, bool include32Bit) {

   patterns->add<ApplyScaleGenericOpConverter>(patterns->getContext(), 100);

   if (include32Bit) {

     patterns->add<ApplyScale32BitOpConverter>(patterns->getContext(), 200);

   }

 }

GreedyPatternRewriteDriver.h

PatternMatch.h

TosaOps.h

TosaToArith.h

TypeUtilities.h

mlir::Builder::getIntegerAttr
IntegerAttr getIntegerAttr(Type type, int64_t value)
Definition: Builders.cpp:224

mlir::Builder::getI64Type
IntegerType getI64Type()
Definition: Builders.cpp:65

mlir::Builder::getI32Type
IntegerType getI32Type()
Definition: Builders.cpp:63

mlir::DenseIntElementsAttr::get
static DenseIntElementsAttr get(const ShapedType &type, Arg &&arg)
Get an instance of a DenseIntElementsAttr with the given arguments.
Definition: BuiltinAttributes.h:963

mlir::Location
This class defines the main interface for locations in MLIR and acts as a non-nullable wrapper around...
Definition: Location.h:76

mlir::OpBuilder::create
Operation * create(const OperationState &state)
Creates an operation given the fields represented as an OperationState.
Definition: Builders.cpp:453

mlir::PatternRewriter
A special type of RewriterBase that coordinates the application of a rewrite pattern on the current I...
Definition: PatternMatch.h:749

mlir::RewritePatternSet
Definition: PatternMatch.h:772

mlir::RewriterBase::replaceOp
virtual void replaceOp(Operation *op, ValueRange newValues)
Replace the results of the given (original) operation with the specified list of values (replacements...
Definition: PatternMatch.cpp:129

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition: Types.h:74

mlir::Type::isInteger
bool isInteger() const
Return true if this is an integer type (with the specified width).
Definition: Types.cpp:56

mlir::Type::getIntOrFloatBitWidth
unsigned getIntOrFloatBitWidth() const
Return the bit width of an integer or a float type, assert failure on other types.
Definition: Types.cpp:122

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:105

Arith.h

mlir::presburger::round
DynamicAPInt round(const Fraction &f)
Definition: Fraction.h:136

mlir::tosa::populateTosaRescaleToArithConversionPatterns
void populateTosaRescaleToArithConversionPatterns(RewritePatternSet *patterns, bool include32Bit=false)
Definition: TosaToArith.cpp:256

mlir::tosa::populateTosaToArithConversionPatterns
void populateTosaToArithConversionPatterns(RewritePatternSet *patterns)
Definition: TosaToArith.cpp:251

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::getElementTypeOrSelf
Type getElementTypeOrSelf(Type type)
Return the element type or return the type itself.
Definition: TypeUtilities.cpp:23

mlir::patterns
const FrozenRewritePatternSet & patterns
Definition: GreedyPatternRewriteDriver.h:283

mlir::OpRewritePattern
OpRewritePattern is a wrapper around RewritePattern that allows for matching and rewriting against an...
Definition: PatternMatch.h:314