doxygen/QuantUtils_8cpp_source.html

 //===- QuantUtils.cpp -----------------------------------------------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 //

 // This file contains TOSA numerical support functions and quantization

 // attribute builders.

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/Tosa/Utils/QuantUtils.h"


 using namespace mlir;

 using namespace mlir::tosa;


 /// From a scale value, generates multiplier and shift values where

 /// mantissa is in [-1.0,-0.5] or [0.5, 1.0] such that

 /// multiplier = mantissa*2^shift for 16-bit scaling.

 static void computeMultiplierAndShiftTosaScale16(double scale,

                                                  int32_t &multiplier,

                                                  int32_t &shift) {


   const double mantissa = std::frexp(scale, &shift);

   auto shiftedM = std::round(mantissa * (int64_t(1) << 15));


   // Can't be greater than 1.0.

   assert(shiftedM <= (int64_t(1) << 15) &&

          "Shifted mantissa exceeds 16 signed bits");


   if (shiftedM == (int64_t(1) << 15)) {

     shiftedM /= 2;

     shift++;

   }


   // TOSA expects right shift to be positive and embed (1 << 15) into right

   // shift bits.

   shift = (-shift) + 15;


   assert(shiftedM <= std::numeric_limits<int32_t>::max() &&

          "Shifted mantissa exceeds 32-bit signed output type");


   multiplier = static_cast<int32_t>(shiftedM);


   // Shifting tops out at 62 bits. Right shift to make 62 bits the max.

   // The limit of 62 on shift allows the shift to be decomposed as

   // two right shifts of 31.

   if (shift > 62) {

     // Shifting the multiplier by more than 31-bits is unnecessary.

     multiplier = multiplier >> std::min<int32_t>(31, shift - 62);

     shift = 62;

   }

 }


 /// From a scale value, generates multiplier and shift values where

 /// mantissa is in [-1.0,-0.5] or [0.5, 1.0] such that

 /// multiplier = mantissa*2^shift for 32-bit scaling.

 static void computeMultiplierAndShiftTosaScale32(double scale,

                                                  int32_t &multiplier,

                                                  int32_t &shift) {


   const double mantissa = std::frexp(scale, &shift);

   auto shiftedM = std::round(mantissa * (int64_t(1) << 31));


   // Can't be greater than 1.0.

   assert(shiftedM <= (int64_t(1) << 31) &&

          "Shifted mantissa exceeds 32 signed bits");

   if (shiftedM == (int64_t(1) << 31)) {

     shiftedM /= 2;

     shift++;

   }


   // TOSA expects right shift to be positive, and embed (1 << 31) into right

   // shift bits.

   shift = (-shift) + 31;


   assert(shiftedM <= std::numeric_limits<int32_t>::max() &&

          "Shifted mantissa exceeds 32-bit signed output type");


   multiplier = static_cast<int32_t>(shiftedM);


   // Shifting tops out at 62 bits. Right shift to make 62 bits the max.

   // The limit of 62 on shift allows the shift to be decomposed as

   // two right shifts of 31.

   if (shift > 62) {

     // Shifting the multiplier by more than 32-bits is unnecessary.

     multiplier = multiplier >> std::min<int32_t>(31, shift - 62);

     shift = 62;

   }

 }


 /// Generates a quantized multiplier/shift from double.

 void mlir::tosa::computeMultiplierAndShift(double scale, int32_t &multiplier,

                                            int32_t &shift, int32_t scaleWidth) {


   switch (scaleWidth) {

   case 16:

     computeMultiplierAndShiftTosaScale16(scale, multiplier, shift);

     return;

   case 32:

     computeMultiplierAndShiftTosaScale32(scale, multiplier, shift);

     return;

   default:

     assert(0 && "Unsupported Tosa quantized_scale regime specified!");

   }

 }


 #define GET_UQTYPE(inputType)                                                  \

   (llvm::dyn_cast<quant::UniformQuantizedType>((inputType).getElementType()))

 #define GET_QTYPE(inputType)                                                   \

   (llvm::dyn_cast<quant::QuantizedType>((inputType).getElementType()))


 /// Method to build ConvOpQuantizationAttr, called from

 /// ConvOpQuantInfoBuilder/TransConvOpQuantInfoBuilder:

 /// input_zp: input zeropoint

 /// weight_zp: weight zeropoint.

 ConvOpQuantizationAttr

 mlir::tosa::buildConvOpQuantizationAttr(OpBuilder &builder, Value input,

                                         Value weight) {


   auto inputType = dyn_cast<ShapedType>(input.getType());

   auto weightType = dyn_cast<ShapedType>(weight.getType());


   if (!inputType || !weightType)

     return nullptr;


   auto inputQType = GET_UQTYPE(inputType);

   auto weightPerTensorQType = GET_UQTYPE(weightType);

   auto weightPerAxisQType =

       dyn_cast<quant::UniformQuantizedPerAxisType>(weightType.getElementType());


   // Weights must be either per-tensor quantized or per-axis quantized.

   assert(!((bool)weightPerTensorQType && (bool)weightPerAxisQType) &&

          "Weights must be either per-tensor or per-axis quantized");


   // Either all quantized or all not quantized.

   assert(!((bool)inputQType ^

            ((bool)weightPerTensorQType || (bool)weightPerAxisQType)) &&

          "Inputs and weights must be all quantized or all not quantized");


   if (inputQType) {

     int64_t inputZp = inputQType.getZeroPoint();

     int64_t weightZp = 0;


     if (weightPerTensorQType) {

       weightZp = weightPerTensorQType.getZeroPoint();

     } else if (weightPerAxisQType) {

       weightZp = weightPerAxisQType.getZeroPoints().front();

     }


     return builder.getAttr<tosa::ConvOpQuantizationAttr>(inputZp, weightZp);

   }


   return nullptr;

 }


 /// Builds MatMulOpQuantizationAttr, called from

 /// MatMulOpQuantInfoBuilder:

 /// aZp: input a zeropoint

 /// bZp: input b zeropoint.

 MatMulOpQuantizationAttr

 mlir::tosa::buildMatMulOpQuantizationAttr(OpBuilder &builder, Value a,

                                           Value b) {


   auto aType = dyn_cast<ShapedType>(a.getType());

   auto bType = dyn_cast<ShapedType>(b.getType());


   if (!aType || !bType)

     return nullptr;


   auto aQType = GET_UQTYPE(aType);

   auto bQType = GET_UQTYPE(bType);


   // A and B are either all quantized or all not quantized.

   assert(!((bool)aQType ^ (bool)bQType) &&

          "Matmul operands must be all quantized or all not quantized");


   if (aQType) {

     return builder.getAttr<tosa::MatMulOpQuantizationAttr>(

         aQType.getZeroPoint(), bQType.getZeroPoint());

   }


   return nullptr;

 }


 /// Builds UnaryOpQuantizationAttr

 /// UnaryOpQuantInfoBuilder:

 /// inputZp: input zeropoint

 /// outputZp: output zeropoint.

 UnaryOpQuantizationAttr

 mlir::tosa::buildUnaryOpQuantizationAttr(OpBuilder &builder, Value input,

                                          Type outputRawType) {


   auto inputType = dyn_cast<ShapedType>(input.getType());

   auto outputType = dyn_cast<ShapedType>(outputRawType);


   if (!inputType || !outputType)

     return nullptr;


   auto inputQType = GET_UQTYPE(inputType);

   auto outputQType = GET_UQTYPE(outputType);


   // Either all quantized or all not quantized.

   assert(!((bool)inputQType ^ (bool)outputQType) &&

          "Unary inputs/outputs must be all quantized or all not quantized");


   if (inputQType) {

     return builder.getAttr<UnaryOpQuantizationAttr>(inputQType.getZeroPoint(),

                                                     outputQType.getZeroPoint());

   }


   return nullptr;

 }


 /// Builds PadOpQuantizationAttr, called from PadOpQuantInfoBuilder:

 /// inputZp: input zeropoint.

 PadOpQuantizationAttr mlir::tosa::buildPadOpQuantizationAttr(OpBuilder &builder,

                                                              Value input) {


   auto inputType = dyn_cast<ShapedType>(input.getType());


   if (!inputType)

     return nullptr;


   auto inputQType = GET_UQTYPE(inputType);


   if (inputQType) {

     return builder.getAttr<tosa::PadOpQuantizationAttr>(

         inputQType.getZeroPoint());

   }


   return nullptr;

 }


 /// Builds output type for a quantized ConvOp with the right bitwidth.

 /// This is called by the builder when dealing with quantized content.

 Type mlir::tosa::buildConvOpResultTypeInfo(OpBuilder &builder, Type outputType,

                                            Value input, Value weight) {


   auto inputType = dyn_cast<ShapedType>(input.getType());

   auto weightType = dyn_cast<ShapedType>(weight.getType());


   assert(inputType && weightType &&

          "Could not extract input or weight tensors from Conv op");


   auto inputQType = GET_QTYPE(inputType);

   auto weightQType = GET_QTYPE(weightType);


   assert(inputQType && weightQType &&

          "Could not extract input or weight tensor types from Conv op");


   unsigned inputBits = inputQType.getStorageTypeIntegralWidth();

   unsigned weightBits = weightQType.getStorageTypeIntegralWidth();


   auto outputShapedType = dyn_cast<ShapedType>(outputType);

   assert(outputShapedType &&

          "Could not extract output shape type from Conv op");


   IntegerType accElementType;

   if (inputBits == 16 && weightBits == 8)

     accElementType = builder.getIntegerType(48);

   else

     accElementType = builder.getI32Type();

   auto accType = outputShapedType.clone(accElementType);

   return accType;

 }


 /// Builds Tosa quantization attributes from min/max values.

 Type mlir::tosa::buildQTypeFromMinMax(OpBuilder builder, Type inputDType,

                                       Attribute minAttr, Attribute maxAttr,

                                       IntegerAttr quantBits, int filterQuantDim,

                                       bool isSigned, BoolAttr narrowRange) {


   quant::QuantizedType retType;


   auto convfunc =

       quant::ExpressedToQuantizedConverter::forInputType(inputDType);


   auto minElems = dyn_cast<DenseFPElementsAttr>(minAttr);

   auto maxElems = dyn_cast<DenseFPElementsAttr>(maxAttr);


   SmallVector<double, 2> min, max;


   // At least one is per-axis quantized elementsattr.

   if (minElems || maxElems) {

     // Must have the same number of elements.

     if (minElems.getNumElements() != maxElems.getNumElements())

       return {};

     min.reserve(minElems.getNumElements());

     max.reserve(maxElems.getNumElements());

     for (auto i : minElems)

       min.push_back(FloatAttr::getValueAsDouble(i));

     for (auto i : maxElems)

       max.push_back(FloatAttr::getValueAsDouble(i));

   } else { // Just a single FP value.

     auto minVal = dyn_cast<FloatAttr>(minAttr);

     if (minVal)

       min.push_back(minVal.getValueAsDouble());

     else

       return {};

     auto maxVal = dyn_cast<FloatAttr>(maxAttr);

     if (maxVal)

       max.push_back(maxVal.getValueAsDouble());

     else

       return {};

   }


   if (min.size() == max.size()) {

     if (min.size() == 1) { // Per-tensor quantization with one min/max pair.

       retType = quant::fakeQuantAttrsToType(

           builder.getUnknownLoc(), quantBits.getInt(), min[0], max[0],

           narrowRange.getValue(), convfunc.expressedType, isSigned);

     } else if (min.size() > 1) { // Per-axis quant on filterQuantDim.

       auto shape = dyn_cast<ShapedType>(inputDType);

       if (!shape)

         return {};

       if ((filterQuantDim) >= 0 && (shape.getRank() > filterQuantDim)) {

         retType = quant::fakeQuantAttrsToType(

             builder.getUnknownLoc(), quantBits.getInt(), filterQuantDim, min[0],

             max[0], narrowRange.getValue(), convfunc.expressedType, isSigned);

       }

     } else {

       return {};

     }

   } else {

     return {};

   }


   if (!retType)

     return {};


   return convfunc.convert(retType);

 }


 /// Builds Tosa quantization attributes from min/max values.

 TypeAttr

 mlir::tosa::buildQTypeAttrFromMinMax(OpBuilder builder, Type inputDtype,

                                      Attribute minAttr, Attribute maxAttr,

                                      IntegerAttr quantBits, int filterQuantDim,

                                      bool isSigned, BoolAttr narrowRange) {


   return TypeAttr::get(buildQTypeFromMinMax(builder, inputDtype, minAttr,

                                             maxAttr, quantBits, filterQuantDim,

                                             isSigned, narrowRange));

 }

frexp
static std::pair< Value, Value > frexp(ImplicitLocOpBuilder &builder, Value arg, bool isPositive=false)
Definition: PolynomialApproximation.cpp:227

max
static Value max(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:213

min
static Value min(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:206

GET_UQTYPE
#define GET_UQTYPE(inputType)
Definition: QuantUtils.cpp:110

computeMultiplierAndShiftTosaScale16
static void computeMultiplierAndShiftTosaScale16(double scale, int32_t &multiplier, int32_t &shift)
From a scale value, generates multiplier and shift values where mantissa is in [-1....
Definition: QuantUtils.cpp:22

GET_QTYPE
#define GET_QTYPE(inputType)
Definition: QuantUtils.cpp:112

computeMultiplierAndShiftTosaScale32
static void computeMultiplierAndShiftTosaScale32(double scale, int32_t &multiplier, int32_t &shift)
From a scale value, generates multiplier and shift values where mantissa is in [-1....
Definition: QuantUtils.cpp:60

QuantUtils.h

llvm::SmallVector
Definition: LLVM.h:69

mlir::Attribute
Attributes are known-constant values of operations.
Definition: Attributes.h:25

mlir::BoolAttr
Special case of IntegerAttr to represent boolean integers, i.e., signless i1 integers.
Definition: BuiltinAttributes.h:844

mlir::BoolAttr::getValue
bool getValue() const
Return the boolean value of this attribute.
Definition: BuiltinAttributes.cpp:405

mlir::Builder::getI32Type
IntegerType getI32Type()
Definition: Builders.cpp:83

mlir::Builder::getIntegerType
IntegerType getIntegerType(unsigned width)
Definition: Builders.cpp:87

mlir::Builder::getUnknownLoc
Location getUnknownLoc()
Definition: Builders.cpp:27

mlir::Builder::getAttr
Attr getAttr(Args &&...args)
Get or construct an instance of the attribute Attr with provided arguments.
Definition: Builders.h:100

mlir::OpBuilder
This class helps build Operations.
Definition: Builders.h:209

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition: Types.h:74

mlir::Value
This class represents an instance of an SSA value in the MLIR system, representing a computable value...
Definition: Value.h:96

mlir::Value::getType
Type getType() const
Return the type of this value.
Definition: Value.h:129

mlir::quant::QuantizedType
Base class for all quantized types known to this dialect.
Definition: QuantTypes.h:49

mlir::presburger::round
MPInt round(const Fraction &f)
Definition: Fraction.h:133

mlir::quant::fakeQuantAttrsToType
UniformQuantizedType fakeQuantAttrsToType(Location loc, unsigned numBits, double rmin, double rmax, bool narrowRange, Type expressedType, bool isSigned=false)
Converts per-layer FakeQuant attributes to the corresponding type.
Definition: FakeQuantSupport.cpp:108

mlir::tosa
Definition: TosaToArith.h:23

mlir::tosa::buildConvOpQuantizationAttr
ConvOpQuantizationAttr buildConvOpQuantizationAttr(OpBuilder &builder, Value input, Value weight)
Method to build ConvOpQuantizationAttr, called from ConvOpQuantInfoBuilder/TransConvOpQuantInfoBuilde...
Definition: QuantUtils.cpp:120

mlir::tosa::buildQTypeAttrFromMinMax
TypeAttr buildQTypeAttrFromMinMax(OpBuilder builder, Type inputDType, Attribute minAttr, Attribute maxAttr, IntegerAttr quantBits, int filterQuantDim, bool isSigned, BoolAttr narrowRange)
Builds Tosa quantization attributes from min/max values.
Definition: QuantUtils.cpp:339

mlir::tosa::buildConvOpResultTypeInfo
Type buildConvOpResultTypeInfo(OpBuilder &builder, Type outputType, Value input, Value weight)
construct ConvOp output type with correct bitwidth based on input/weight width.
Definition: QuantUtils.cpp:239

mlir::tosa::buildQTypeFromMinMax
Type buildQTypeFromMinMax(OpBuilder builder, Type inputDType, Attribute minAttr, Attribute maxAttr, IntegerAttr quantBits, int filterQuantDim, bool isSigned, BoolAttr narrowRange)
Builds Tosa quantization attributes from min/max values.
Definition: QuantUtils.cpp:271

mlir::tosa::buildPadOpQuantizationAttr
PadOpQuantizationAttr buildPadOpQuantizationAttr(OpBuilder &builder, Value input)
Builds PadOpQuantizationAttr, called from PadOpQuantInfoBuilder: inputZp: input zeropoint.
Definition: QuantUtils.cpp:219

mlir::tosa::buildMatMulOpQuantizationAttr
MatMulOpQuantizationAttr buildMatMulOpQuantizationAttr(OpBuilder &builder, Value a, Value b)
Builds MatMulOpQuantizationAttr, called from MatMulOpQuantInfoBuilder: aZp: input a zeropoint bZp: in...
Definition: QuantUtils.cpp:164

mlir::tosa::computeMultiplierAndShift
void computeMultiplierAndShift(double scale, int32_t &multiplier, int32_t &shift, int32_t scaleWidth)
From a scale value, computes multiplier and shift values for 16 or 32-bit scale widths.
Definition: QuantUtils.cpp:95

mlir::tosa::buildUnaryOpQuantizationAttr
UnaryOpQuantizationAttr buildUnaryOpQuantizationAttr(OpBuilder &builder, Value input, Type outputRawType)
Builds UnaryOpQuantizationAttr UnaryOpQuantInfoBuilder: inputZp: input zeropoint outputZp: output zer...
Definition: QuantUtils.cpp:193

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:510

mlir::quant::ExpressedToQuantizedConverter::forInputType
static ExpressedToQuantizedConverter forInputType(Type inputType)
Creates a converter for the given input type.
Definition: UniformSupport.cpp:21