doxygen/Dialect_2Quant_2IR_2TypeParser_8cpp_source.html

 //===- TypeParser.cpp - Quantization Type Parser ----------------*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/Quant/IR/Quant.h"

 #include "mlir/Dialect/Quant/IR/QuantTypes.h"

 #include "mlir/IR/BuiltinTypes.h"

 #include "mlir/IR/DialectImplementation.h"

 #include "mlir/IR/Types.h"

 #include "llvm/ADT/APFloat.h"


 using namespace mlir;

 using namespace quant;


 /// Parses the storage type of a quantized type.
 ///
 /// Two spellings are accepted:
 ///   * a builtin integer type recognised by `parseOptionalType`; `isSigned` is
 ///     then set to `!type.isUnsigned()`;
 ///   * a keyword of the form `u<width>`; `isSigned` is set to false and the
 ///     result is `getIntegerType(width)`.
 ///
 /// The width must lie in [1, QuantizedType::MaxStorageBits]. Returns a null
 /// type on failure; `isSigned` is only written once a spelling was accepted.
 static IntegerType parseStorageType(DialectAsmParser &parser, bool &isSigned) {
   const auto startLoc = parser.getCurrentLocation();
   IntegerType storage;
   unsigned bitWidth = 0;

   OptionalParseResult optionalResult = parser.parseOptionalType(storage);
   if (optionalResult.has_value()) {
     // A builtin type was present; it either parsed cleanly or we give up.
     if (failed(*optionalResult))
       return nullptr;
     bitWidth = storage.getWidth();
     isSigned = !storage.isUnsigned();
   } else {
     // Otherwise the only accepted form is the keyword `u<width>`.
     StringRef spelling;
     if (failed(parser.parseKeyword(&spelling)))
       return nullptr;
     if (!spelling.consume_front("u")) {
       parser.emitError(startLoc, "illegal storage type prefix");
       return nullptr;
     }
     // getAsInteger returns true on error.
     if (spelling.getAsInteger(10, bitWidth)) {
       parser.emitError(startLoc, "expected storage type width");
       return nullptr;
     }
     isSigned = false;
     storage = parser.getBuilder().getIntegerType(bitWidth);
   }

   const bool widthIsLegal =
       bitWidth != 0 && bitWidth <= QuantizedType::MaxStorageBits;
   if (!widthIsLegal) {
     parser.emitError(startLoc, "illegal storage type size: ") << bitWidth;
     return nullptr;
   }
   return storage;
 }


 /// Parses the optional explicit storage range `<min:max>`.
 ///
 /// When no `<` follows, `storageTypeMin`/`storageTypeMax` receive the default
 /// bounds for an integer of `storageType`'s width and the given signedness.
 /// Otherwise both bounds are parsed, and an error is emitted if the minimum is
 /// below the default minimum or the maximum is above the default maximum.
 static ParseResult parseStorageRange(DialectAsmParser &parser,
                                      IntegerType storageType, bool isSigned,
                                      int64_t &storageTypeMin,
                                      int64_t &storageTypeMax) {
   const int64_t lowestAllowed = QuantizedType::getDefaultMinimumForInteger(
       isSigned, storageType.getWidth());
   const int64_t highestAllowed = QuantizedType::getDefaultMaximumForInteger(
       isSigned, storageType.getWidth());

   if (succeeded(parser.parseOptionalLess())) {
     // Explicit `min:max>`; remember where each bound starts for diagnostics.
     SMLoc minLoc = parser.getCurrentLocation();
     if (failed(parser.parseInteger(storageTypeMin)))
       return failure();
     if (failed(parser.parseColon()))
       return failure();
     SMLoc maxLoc = parser.getCurrentLocation();
     if (failed(parser.parseInteger(storageTypeMax)))
       return failure();
     if (failed(parser.parseGreater()))
       return failure();

     if (storageTypeMin < lowestAllowed)
       return parser.emitError(minLoc, "illegal storage type minimum: ")
              << storageTypeMin;
     if (storageTypeMax > highestAllowed)
       return parser.emitError(maxLoc, "illegal storage type maximum: ")
              << storageTypeMax;
     return success();
   }

   // No explicit range: fall back to the full range of the storage type.
   storageTypeMin = lowestAllowed;
   storageTypeMax = highestAllowed;
   return success();
 }


 /// Parses `expressed-type `<` min `:` max `>``, storing the calibrated bounds
 /// in `min` and `max`. Returns the parsed float type, or a null type after
 /// emitting a diagnostic at the start of the expressed type.
 static FloatType parseExpressedTypeAndRange(DialectAsmParser &parser,
                                             double &min, double &max) {
   const auto startLoc = parser.getCurrentLocation();

   FloatType expressed;
   if (failed(parser.parseType(expressed))) {
     parser.emitError(startLoc, "expecting float expressed type");
     return nullptr;
   }

   // The calibrated range is mandatory; stop at the first piece that fails.
   const bool rangeParsed =
       succeeded(parser.parseLess()) && succeeded(parser.parseFloat(min)) &&
       succeeded(parser.parseColon()) && succeeded(parser.parseFloat(max)) &&
       succeeded(parser.parseGreater());
   if (!rangeParsed) {
     parser.emitError(startLoc, "calibrated values must be present");
     return nullptr;
   }
   return expressed;
 }


 /// Parses the body of an AnyQuantizedType (the `any` keyword has already been
 /// consumed by the caller).
 ///
 ///   any ::= `any<` storage-spec (expressed-type-spec)?`>`
 ///   storage-spec ::= storage-type (`<` storage-range `>`)?
 ///   storage-range ::= integer-literal `:` integer-literal
 ///   storage-type ::= (`i` | `u`) integer-literal
 ///   expressed-type-spec ::= `:` `f` integer-literal
 ///
 /// Returns a null type if any component fails to parse.
 static Type parseAnyType(DialectAsmParser &parser) {
   // Opening `<`.
   if (failed(parser.parseLess()))
     return nullptr;

   // Storage type; its signedness becomes a quantization flag.
   bool isSigned = false;
   IntegerType storageType = parseStorageType(parser, isSigned);
   if (!storageType)
     return nullptr;
   unsigned typeFlags = 0;
   if (isSigned)
     typeFlags |= QuantizationFlags::Signed;

   // Storage range (explicit, or the defaults for the storage type).
   int64_t storageTypeMin;
   int64_t storageTypeMax;
   if (failed(parseStorageRange(parser, storageType, isSigned, storageTypeMin,
                                storageTypeMax)))
     return nullptr;

   // The expressed type is optional and stays null when absent.
   FloatType expressedType;
   if (succeeded(parser.parseOptionalColon()) &&
       failed(parser.parseType(expressedType)))
     return nullptr;

   // Closing `>`.
   if (failed(parser.parseGreater()))
     return nullptr;

   return parser.getChecked<AnyQuantizedType>(
       typeFlags, storageType, expressedType, storageTypeMin, storageTypeMax);
 }


 /// Checks if the given scale value is within the valid range of the expressed
 /// type. The `expressedType` argument is the floating-point type used for
 /// expressing the quantized values (it must be a FloatType), and `scale` is
 /// the double value to check.
 ///
 /// The accepted range is [APFloat::getSmallest, APFloat::getLargest] of the
 /// expressed type's semantics, with both bounds converted to double. On
 /// violation a diagnostic is produced through `emitError` and failure is
 /// returned.
 LogicalResult
 isScaleInExpressedTypeRange(function_ref<InFlightDiagnostic()> emitError,
                             Type expressedType, double scale) {
   auto floatType = cast<FloatType>(expressedType);
   const auto &semantics = floatType.getFloatSemantics();

   // APFloat::convertToDouble() is only valid for semantics that are exactly
   // representable as an IEEE double and asserts otherwise (e.g. for f80 or
   // f128 expressed types). Convert to IEEE double explicitly first; bounds
   // that do not fit in a double are rounded by that conversion.
   auto toDouble = [](APFloat value) -> double {
     bool losesInfo = false;
     value.convert(APFloat::IEEEdouble(), APFloat::rmNearestTiesToEven,
                   &losesInfo);
     return value.convertToDouble();
   };

   double minScale = toDouble(APFloat::getSmallest(semantics));
   double maxScale = toDouble(APFloat::getLargest(semantics));
   if (scale < minScale || scale > maxScale)
     return emitError() << "scale " << scale << " out of expressed type range ["
                        << minScale << ", " << maxScale << "]";
   return success();
 }


 /// Parses a quantization parameter, which is either a scale value (float) or a
 /// scale-zero point pair (float:integer). `expressedType`, expressing the type
 /// of scale values, is used to validate the scale. The parsed scale and zero
 /// point are stored in `scale` and `zeroPoint`; `zeroPoint` is set to 0 when
 /// no `:` zero-point suffix is present.
 static ParseResult parseQuantParams(DialectAsmParser &parser,
                                     Type expressedType, double &scale,
                                     int64_t &zeroPoint) {
   // Record where the scale literal starts *before* consuming it, so that an
   // out-of-range diagnostic points at the scale rather than at whatever token
   // follows it.
   SMLoc scaleLoc = parser.getCurrentLocation();
   if (parser.parseFloat(scale))
     return failure();

   if (failed(isScaleInExpressedTypeRange(
           [&]() { return parser.emitError(scaleLoc); }, expressedType,
           scale)))
     return failure();

   // The zero point is optional and defaults to 0.
   zeroPoint = 0;
   if (failed(parser.parseOptionalColon()))
     return success();

   return parser.parseInteger(zeroPoint);
 }


 /// Parses the block-size list of a sub-channel quantized type. The opening
 /// '{' must already have been consumed; parsing continues through the closing
 /// '}'.
 ///
 /// The list is either empty or a comma-separated sequence of
 /// "Axis:BlockSize" pairs. Each axis is appended to `quantizedDimensions` and
 /// each block size to `blockSizes`, in source order.
 static ParseResult
 parseBlockSizeInfoUntilRBrace(DialectAsmParser &parser,
                               SmallVectorImpl<int32_t> &quantizedDimensions,
                               SmallVectorImpl<int64_t> &blockSizes) {
   // `{}`: nothing to record.
   if (succeeded(parser.parseOptionalRBrace()))
     return success();

   auto parseAxisBlockPair = [&]() -> ParseResult {
     // Reserve a slot in each output first, then parse straight into it.
     quantizedDimensions.push_back(0);
     blockSizes.push_back(0);
     if (failed(parser.parseInteger(quantizedDimensions.back())))
       return failure();
     if (failed(parser.parseColon()))
       return failure();
     if (failed(parser.parseInteger(blockSizes.back())))
       return failure();
     return success();
   };

   if (failed(parser.parseCommaSeparatedList(parseAxisBlockPair)))
     return failure();
   if (failed(parser.parseRBrace()))
     return failure();
   return success();
 }


 /// Parses a (possibly nested) brace-delimited list of quantization parameters.
 /// The opening '{' must already have been consumed; parsing continues through
 /// the matching '}'.
 ///
 /// Every leaf `scale[:zero_point]` is appended to `scales` / `zeroPoints` in
 /// the order it is encountered. On success `dims` holds the number of elements
 /// of this list followed by the dimensions of its (first) sub-list. Examples:
 ///
 ///   parseQuantParamListUntilRBrace(1.0:1, 2.0:4, 3.0:4}) -> Success,
 ///       dims = [3], scales = [1.0, 2.0, 3.0], zeroPoints = [1, 4, 4]
 ///
 ///   parseQuantParamListUntilRBrace({1.0, 2.0}, {3.0:1, 4.0:9}}) -> Success,
 ///       dims = [2, 2], scales = [1.0, 2.0, 3.0, 4.0], zeroPoints = [0, 0, 1,
 ///       9]
 ///
 /// All elements of one list must report identical dimensions; otherwise an
 /// error is emitted.
 static ParseResult
 parseQuantParamListUntilRBrace(DialectAsmParser &parser, Type expressedType,
                                SmallVectorImpl<double> &scales,
                                SmallVectorImpl<int64_t> &zeroPoints,
                                SmallVectorImpl<int64_t> &dims) {
   // Dimensions reported by the first element; later elements must match.
   SmallVector<int64_t, 4> referenceDims;
   unsigned elementCount = 0;

   auto parseElement = [&]() -> ParseResult {
     SmallVector<int64_t, 4> elementDims;
     if (failed(parser.parseOptionalLBrace())) {
       // Leaf element: parse directly into freshly appended slots.
       scales.push_back(0.0);
       zeroPoints.push_back(0);
       if (parseQuantParams(parser, expressedType, scales.back(),
                            zeroPoints.back()))
         return failure();
     } else if (parseQuantParamListUntilRBrace(parser, expressedType, scales,
                                               zeroPoints, elementDims)) {
       // Nested list failed to parse.
       return failure();
     }

     // The first element defines the reference dimensions.
     if (++elementCount == 1) {
       referenceDims = elementDims;
       return success();
     }
     if (referenceDims == elementDims)
       return success();
     return parser.emitError(parser.getCurrentLocation())
            << "tensor literal is invalid; ranks are not consistent "
               "between elements";
   };

   if (failed(parser.parseCommaSeparatedList(parseElement)))
     return failure();
   if (failed(parser.parseRBrace()))
     return failure();

   // Result: this list's length followed by the sub-list dimensions.
   dims.clear();
   dims.push_back(elementCount);
   dims.append(referenceDims.begin(), referenceDims.end());
   return success();
 }


 /// Parses the body of a uniform quantized type (the `uniform` keyword has
 /// already been consumed by the caller). Depending on what follows the
 /// expressed type, the result is a UniformQuantizedType (per-layer), a
 /// UniformQuantizedPerAxisType or a UniformQuantizedSubChannelType.
 ///
 ///   uniform_type ::= uniform_per_layer
 ///                  | uniform_per_axis
 ///                  | uniform_sub_channel
 ///   uniform_per_layer ::= `uniform<` storage-spec expressed-type-spec
 ///                          `,` scale-zero `>`
 ///   uniform_per_axis ::= `uniform<` storage-spec expressed-type-spec
 ///                        axis-spec `,` `{` scale-zero-list `}` `>`
 ///   uniform_sub_channel ::= `uniform<` storage-spec expressed-type-spec
 ///                        `:` block-size-info `,` scale-zero-tensor `>`
 ///   storage-spec ::= storage-type (`<` storage-range `>`)?
 ///   storage-range ::= integer-literal `:` integer-literal
 ///   storage-type ::= (`i` | `u`) integer-literal
 ///   expressed-type-spec ::= `:` `f` integer-literal
 ///   axis-spec ::= `:` integer-literal
 ///   scale-zero ::= scale (`:` zero-point)?
 ///   scale ::= float-literal
 ///   zero-point ::= integer-literal
 ///   scale-zero-list ::= scale-zero (`,` scale-zero)*
 ///   block-size-info ::= `{` `}` | `{` axis-block (`,` axis-block)* `}`
 ///   axis-block ::= integer-literal `:` block-size-spec
 ///   block-size-spec ::= integer-literal
 ///   scale-zero-tensor ::= `{` scale-zero-element (`,` scale-zero-element)* `}`
 ///   scale-zero-element ::= scale-zero | scale-zero-tensor
 ///
 /// Returns a null type if any component fails to parse.
 static Type parseUniformType(DialectAsmParser &parser) {
   // Which flavour of uniform quantization the text describes.
   enum class Scheme { PerTensor, PerAxis, SubChannel };

   // Opening `<`.
   if (failed(parser.parseLess()))
     return nullptr;

   // Storage type; its signedness becomes a quantization flag.
   bool isSigned = false;
   IntegerType storageType = parseStorageType(parser, isSigned);
   if (!storageType)
     return nullptr;
   unsigned typeFlags = 0;
   if (isSigned)
     typeFlags |= QuantizationFlags::Signed;

   // Storage range (explicit, or the defaults for the storage type).
   int64_t storageTypeMin;
   int64_t storageTypeMax;
   if (failed(parseStorageRange(parser, storageType, isSigned, storageTypeMin,
                                storageTypeMax)))
     return nullptr;

   // Mandatory expressed type.
   FloatType expressedType;
   if (failed(parser.parseColon()) || failed(parser.parseType(expressedType)))
     return nullptr;

   // A further `:` selects sub-channel (`{` block sizes `}`) or per-axis
   // (a single axis index) quantization; without it the type is per-tensor.
   Scheme scheme = Scheme::PerTensor;
   SmallVector<int32_t, 1> quantizedDimensions;
   SmallVector<int64_t, 1> blockSizes;
   if (succeeded(parser.parseOptionalColon())) {
     if (succeeded(parser.parseOptionalLBrace())) {
       scheme = Scheme::SubChannel;
       if (failed(parseBlockSizeInfoUntilRBrace(parser, quantizedDimensions,
                                                blockSizes)))
         return nullptr;
     } else {
       scheme = Scheme::PerAxis;
       quantizedDimensions.resize(1);
       if (failed(parser.parseInteger(quantizedDimensions.back())))
         return nullptr;
     }
   }

   // Comma separating the type description from the scale/zero-point data.
   if (failed(parser.parseComma()))
     return nullptr;

   // Scales and zero points: a single pair for per-tensor, a braced (possibly
   // nested) list otherwise. `dims` is only filled in by the list form.
   SmallVector<double, 1> scales;
   SmallVector<int64_t, 1> zeroPoints;
   SmallVector<int64_t> dims;
   if (scheme == Scheme::PerTensor) {
     scales.push_back(0.0);
     zeroPoints.push_back(0);
     if (failed(parseQuantParams(parser, expressedType, scales.back(),
                                 zeroPoints.back())))
       return nullptr;
   } else if (failed(parser.parseLBrace()) ||
              failed(parseQuantParamListUntilRBrace(
                  parser, expressedType, scales, zeroPoints, dims))) {
     return nullptr;
   }

   // Closing `>`.
   if (failed(parser.parseGreater()))
     return nullptr;

   if (scheme == Scheme::PerTensor)
     return parser.getChecked<UniformQuantizedType>(
         typeFlags, storageType, expressedType, scales.front(),
         zeroPoints.front(), storageTypeMin, storageTypeMax);

   if (scheme == Scheme::PerAxis)
     return parser.getChecked<UniformQuantizedPerAxisType>(
         typeFlags, storageType, expressedType, scales, zeroPoints,
         quantizedDimensions[0], storageTypeMin, storageTypeMax);

   // Sub-channel: scales and zero points are carried as dense tensors of shape
   // `dims`, so convert them to the expressed / storage element types first.
   SmallVector<APFloat> apFloatScales;
   apFloatScales.reserve(scales.size());
   for (double scale : scales) {
     APFloat converted(scale);
     bool losesInfo;
     converted.convert(expressedType.getFloatSemantics(),
                       APFloat::rmNearestTiesToEven, &losesInfo);
     apFloatScales.push_back(converted);
   }

   SmallVector<APInt> apIntZeroPoints;
   apIntZeroPoints.reserve(zeroPoints.size());
   for (int64_t zeroPoint : zeroPoints)
     apIntZeroPoints.push_back(
         APInt(storageType.getIntOrFloatBitWidth(), zeroPoint));

   auto scalesAttr = mlir::DenseElementsAttr::get(
       RankedTensorType::get(dims, expressedType), apFloatScales);
   auto zeroPointsAttr = mlir::DenseElementsAttr::get(
       RankedTensorType::get(dims, storageType), apIntZeroPoints);
   return parser.getChecked<UniformQuantizedSubChannelType>(
       typeFlags, storageType, expressedType, scalesAttr, zeroPointsAttr,
       quantizedDimensions, blockSizes, storageTypeMin, storageTypeMax);
 }


 /// Parses the body of a CalibratedQuantizedType (the `calibrated` keyword has
 /// already been consumed by the caller).
 ///
 ///   calibrated ::= `calibrated<` expressed-spec `>`
 ///   expressed-spec ::= expressed-type `<` calibrated-range `>`
 ///   expressed-type ::= `f` integer-literal
 ///   calibrated-range ::= float-literal `:` float-literal
 ///
 /// Returns a null type if any component fails to parse.
 static Type parseCalibratedType(DialectAsmParser &parser) {
   // Opening `<`.
   if (failed(parser.parseLess()))
     return nullptr;

   // Expressed type together with its calibrated `<min:max>` range.
   double min;
   double max;
   FloatType expressedType = parseExpressedTypeAndRange(parser, min, max);
   if (!expressedType)
     return nullptr;

   // Closing `>`.
   if (failed(parser.parseGreater()))
     return nullptr;

   return parser.getChecked<CalibratedQuantizedType>(expressedType, min, max);
 }


 /// Parse a type registered to this dialect. The leading keyword (`uniform`,
 /// `any` or `calibrated`) selects the type-specific parser; any other keyword
 /// is reported as an error and yields a null type.
 Type QuantDialect::parseType(DialectAsmParser &parser) const {
   StringRef typeNameSpelling;
   if (failed(parser.parseKeyword(&typeNameSpelling)))
     return nullptr;

   // Keyword -> parser dispatch table.
   struct KeywordParser {
     const char *keyword;
     Type (*parse)(DialectAsmParser &);
   };
   static const KeywordParser keywordParsers[] = {
       {"uniform", parseUniformType},
       {"any", parseAnyType},
       {"calibrated", parseCalibratedType},
   };

   for (const KeywordParser &entry : keywordParsers)
     if (typeNameSpelling == entry.keyword)
       return entry.parse(parser);

   parser.emitError(parser.getNameLoc(),
                    "unknown quantized type " + typeNameSpelling);
   return nullptr;
 }


 /// Prints the storage spec of `type`: `i<width>` for signed or `u<width>` for
 /// unsigned storage, followed by `<min:max>` only when the type reports
 /// explicit storage bounds.
 static void printStorageType(QuantizedType type, DialectAsmPrinter &out) {
   const char *signednessPrefix = type.isSigned() ? "i" : "u";
   out << signednessPrefix << type.getStorageTypeIntegralWidth();

   // Default bounds are implied by the storage type and are not printed.
   if (!type.hasStorageTypeBounds())
     return;
   out << "<" << type.getStorageTypeMin() << ":" << type.getStorageTypeMax()
       << ">";
 }


 /// Prints one quantization parameter as `scale` or, when the zero point is
 /// non-zero, as `scale:zeroPoint`.
 static void printQuantParams(double scale, int64_t zeroPoint,
                              DialectAsmPrinter &out) {
   out << scale;
   // A zero point of 0 is the default and is left implicit.
   if (zeroPoint == 0)
     return;
   out << ":" << zeroPoint;
 }


 /// Prints sub-channel block sizes as `{axis:size, axis:size, ...}`; an empty
 /// list prints as `{}`.
 static void
 printBlockSizeInfo(ArrayRef<std::pair<int32_t, int64_t>> blockSizeInfo,
                    DialectAsmPrinter &out) {
   out << "{";
   llvm::interleaveComma(blockSizeInfo, out,
                         [&](const std::pair<int32_t, int64_t> &axisAndSize) {
                           out << axisAndSize.first << ":"
                               << axisAndSize.second;
                         });
   out << "}";
 }


 /// Helper that prints an AnyQuantizedType as `any<storage-spec[:expressed]>`.
 /// The expressed type is omitted when the type has none.
 static void printAnyQuantizedType(AnyQuantizedType type,
                                   DialectAsmPrinter &out) {
   out << "any<";
   printStorageType(type, out);

   Type expressedType = type.getExpressedType();
   if (expressedType)
     out << ":" << expressedType;

   out << ">";
 }


 /// Helper that prints a per-layer UniformQuantizedType as
 /// `uniform<storage-spec:expressed, scale[:zeroPoint]>`.
 static void printUniformQuantizedType(UniformQuantizedType type,
                                       DialectAsmPrinter &out) {
   // Storage and expressed types.
   out << "uniform<";
   printStorageType(type, out);
   out << ":" << type.getExpressedType();
   out << ", ";

   // The single scale / zero-point pair.
   const double scale = type.getScale();
   const int64_t zeroPoint = type.getZeroPoint();
   printQuantParams(scale, zeroPoint, out);
   out << ">";
 }


 /// Helper that prints a UniformQuantizedPerAxisType as
 /// `uniform<storage-spec:expressed:axis, {scale[:zp],scale[:zp],...}>`.
 static void printUniformQuantizedPerAxisType(UniformQuantizedPerAxisType type,
                                              DialectAsmPrinter &out) {
   // Storage type, expressed type and the quantized axis.
   out << "uniform<";
   printStorageType(type, out);
   out << ":" << type.getExpressedType();
   out << ":" << type.getQuantizedDimension() << ", ";

   // One scale / zero-point pair per slice along the axis, joined by ",".
   ArrayRef<double> scales = type.getScales();
   ArrayRef<int64_t> zeroPoints = type.getZeroPoints();
   out << "{";
   for (size_t i = 0, numScales = scales.size(); i != numScales; ++i) {
     if (i != 0)
       out << ",";
     printQuantParams(scales[i], zeroPoints[i], out);
   }
   out << "}>";
 }


 /// Prints quantization parameters as a nested list of `scale`[:`zero_point`]
 /// elements.  The nesting corresponds to the `shape` dimensions.
 ///
 /// Elements are delimited by commas, and the inner dimensions are enclosed in
 /// braces.  `zero_point` is only printed if it is non-zero.  For example:
 ///
 ///   printDenseQuantizationParameters(scales=[1.0, 2.0, 3.0, 4.0],
 ///                                   zeroPoints=[0, 0, 1, 9],
 ///                                   shape=[2, 2])
 ///
 ///   would print:
 ///
 ///     {{1.0, 2.0}, {3.0:1, 4.0:9}}
 ///
 /// `scales` and `zeroPoints` are read in lock-step, one entry per element.
 /// An empty `shape` (rank 0) prints the elements without any braces.
 void printDenseQuantizationParameters(ArrayRef<APFloat> scales,
                                       ArrayRef<APInt> zeroPoints,
                                       ArrayRef<int64_t> shape,
                                       DialectAsmPrinter &out) {
   const int64_t rank = shape.size();
   // Multi-dimensional index of the element about to be printed.
   SmallVector<int64_t, 4> counter(rank, 0);
   // Number of '{' currently awaiting their matching '}'.
   int64_t openBrackets = 0;

   // Advances `counter` by one element and closes every dimension that has
   // just been completed (except the outermost, which is closed at the end).
   auto incrementCounterAndDelimit = [&]() {
     // With rank 0 there is no index to advance and nothing to close; without
     // this guard `counter[rank - 1]` would index an empty vector.
     if (rank == 0)
       return;
     ++counter[rank - 1];
     for (int64_t i = rank - 1; i > 0; --i) {
       if (counter[i] >= shape[i]) {
         counter[i] = 0;
         ++counter[i - 1];
         --openBrackets;
         out << '}';
       }
     }
   };

   for (size_t idx = 0, e = scales.size(); idx < e; ++idx) {
     if (idx != 0)
       out << ", ";
     // Re-open every dimension that was closed after the previous element.
     for (; openBrackets < rank; ++openBrackets)
       out << '{';
     out << scales[idx];
     if (zeroPoints[idx] != 0) {
       out << ":" << zeroPoints[idx];
     }
     incrementCounterAndDelimit();
   }

   // Close whatever is still open (the outermost dimension).
   for (; openBrackets > 0; --openBrackets)
     out << '}';
 }


 /// Helper that prints a UniformQuantizedSubChannelType as
 /// `uniform<storage-spec:expressed:{block sizes}, {nested scale[:zp] list}>`.
 static void
 printUniformQuantizedSubChannelType(UniformQuantizedSubChannelType type,
                                     DialectAsmPrinter &out) {
   // Storage type, expressed type and block-size info.
   out << "uniform<";
   printStorageType(type, out);
   out << ":" << type.getExpressedType();
   out << ":";
   printBlockSizeInfo(type.getBlockSizeInfo(), out);
   out << ", ";

   // Materialize the dense scale / zero-point values, then print them nested
   // according to the shape of the scales tensor.
   auto scalesAttr = type.getScales();
   auto zeroPointsAttr = type.getZeroPoints();
   auto scaleValues = scalesAttr.getValues<APFloat>();
   auto zeroPointValues = zeroPointsAttr.getValues<APInt>();
   SmallVector<APFloat> scales(scaleValues.begin(), scaleValues.end());
   SmallVector<APInt> zeroPoints(zeroPointValues.begin(),
                                 zeroPointValues.end());
   printDenseQuantizationParameters(scales, zeroPoints,
                                    scalesAttr.getType().getShape(), out);
   out << ">";
 }


 /// Helper that prints a CalibratedQuantizedType as
 /// `calibrated<expressed<min:max>>`.
 static void printCalibratedQuantizedType(CalibratedQuantizedType type,
                                          DialectAsmPrinter &out) {
   const double calibratedMin = type.getMin();
   const double calibratedMax = type.getMax();

   out << "calibrated<" << type.getExpressedType();
   out << "<" << calibratedMin << ":" << calibratedMax << ">";
   out << ">";
 }


 /// Print a type registered to this dialect by dispatching on its concrete
 /// quantized type. Reaching the end without a match is treated as
 /// unreachable.
 void QuantDialect::printType(Type type, DialectAsmPrinter &os) const {
   if (auto anyType = llvm::dyn_cast<AnyQuantizedType>(type)) {
     printAnyQuantizedType(anyType, os);
     return;
   }
   if (auto uniformType = llvm::dyn_cast<UniformQuantizedType>(type)) {
     printUniformQuantizedType(uniformType, os);
     return;
   }
   if (auto perAxisType = llvm::dyn_cast<UniformQuantizedPerAxisType>(type)) {
     printUniformQuantizedPerAxisType(perAxisType, os);
     return;
   }
   if (auto subChannelType =
           llvm::dyn_cast<UniformQuantizedSubChannelType>(type)) {
     printUniformQuantizedSubChannelType(subChannelType, os);
     return;
   }
   if (auto calibratedType = llvm::dyn_cast<CalibratedQuantizedType>(type)) {
     printCalibratedQuantizedType(calibratedType, os);
     return;
   }
   llvm_unreachable("Unhandled quantized type");
 }

DialectImplementation.h

printBlockSizeInfo
static void printBlockSizeInfo(ArrayRef< std::pair< int32_t, int64_t >> blockSizeInfo, DialectAsmPrinter &out)
Definition: TypeParser.cpp:513

parseQuantParams
static ParseResult parseQuantParams(DialectAsmParser &parser, Type expressedType, double &scale, int64_t &zeroPoint)
Parses a quantization parameter, which is either a scale value (float) or a scale-zero point pair (fl...
Definition: TypeParser.cpp:178

printDenseQuantizationParameters
void printDenseQuantizationParameters(ArrayRef< APFloat > scales, ArrayRef< APInt > zeroPoints, ArrayRef< int64_t > shape, DialectAsmPrinter &out)
Prints quantization parameters as a nested list of scale[:zero_point] elements.
Definition: TypeParser.cpp:581

printAnyQuantizedType
static void printAnyQuantizedType(AnyQuantizedType type, DialectAsmPrinter &out)
Helper that prints a AnyQuantizedType.
Definition: TypeParser.cpp:524

isScaleInExpressedTypeRange
LogicalResult isScaleInExpressedTypeRange(function_ref< InFlightDiagnostic()> emitError, Type expressedType, double scale)
Checks if the given scale value is within the valid range of the expressed type.
Definition: TypeParser.cpp:161

parseExpressedTypeAndRange
static FloatType parseExpressedTypeAndRange(DialectAsmParser &parser, double &min, double &max)
Definition: TypeParser.cpp:89

printUniformQuantizedSubChannelType
static void printUniformQuantizedSubChannelType(UniformQuantizedSubChannelType type, DialectAsmPrinter &out)
Helper that prints a UniformQuantizedSubChannelType.
Definition: TypeParser.cpp:619

parseUniformType
static Type parseUniformType(DialectAsmParser &parser)
Parses a UniformQuantizedType.
Definition: TypeParser.cpp:324

parseStorageType
static IntegerType parseStorageType(DialectAsmParser &parser, bool &isSigned)
Definition: TypeParser.cpp:19

parseAnyType
static Type parseAnyType(DialectAsmParser &parser)
Parses an AnyQuantizedType.
Definition: TypeParser.cpp:115

printStorageType
static void printStorageType(QuantizedType type, DialectAsmPrinter &out)
Definition: TypeParser.cpp:487

parseBlockSizeInfoUntilRBrace
static ParseResult parseBlockSizeInfoUntilRBrace(DialectAsmParser &parser, SmallVectorImpl< int32_t > &quantizedDimensions, SmallVectorImpl< int64_t > &blockSizes)
Parses block size information for sub-channel quantization, assuming the leading '{' has already been...
Definition: TypeParser.cpp:207

printQuantParams
static void printQuantParams(double scale, int64_t zeroPoint, DialectAsmPrinter &out)
Definition: TypeParser.cpp:504

parseCalibratedType
static Type parseCalibratedType(DialectAsmParser &parser)
Parses an CalibratedQuantizedType.
Definition: TypeParser.cpp:446

parseQuantParamListUntilRBrace
static ParseResult parseQuantParamListUntilRBrace(DialectAsmParser &parser, Type expressedType, SmallVectorImpl< double > &scales, SmallVectorImpl< int64_t > &zeroPoints, SmallVectorImpl< int64_t > &dims)
Parses a bracketed list of quantization parameters, returning the dimensions of the parsed sub-tensor...
Definition: TypeParser.cpp:246

parseStorageRange
static ParseResult parseStorageRange(DialectAsmParser &parser, IntegerType storageType, bool isSigned, int64_t &storageTypeMin, int64_t &storageTypeMax)
Definition: TypeParser.cpp:58

printCalibratedQuantizedType
static void printCalibratedQuantizedType(CalibratedQuantizedType type, DialectAsmPrinter &out)
Helper that prints a CalibratedQuantizedType.
Definition: TypeParser.cpp:637

printUniformQuantizedPerAxisType
static void printUniformQuantizedPerAxisType(UniformQuantizedPerAxisType type, DialectAsmPrinter &out)
Helper that prints a UniformQuantizedPerAxisType.
Definition: TypeParser.cpp:547

printUniformQuantizedType
static void printUniformQuantizedType(UniformQuantizedType type, DialectAsmPrinter &out)
Helper that prints a UniformQuantizedType.
Definition: TypeParser.cpp:535

Types.h

max
static Value max(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:212

min
static Value min(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:204

QuantTypes.h

llvm::ArrayRef
Definition: LLVM.h:48

llvm::SmallVectorImpl
Definition: LLVM.h:74

llvm::SmallVector
Definition: LLVM.h:72

llvm::function_ref
Definition: LLVM.h:90

mlir::AsmParser::parseLBrace
virtual ParseResult parseLBrace()=0
Parse a { token.

mlir::AsmParser::parseOptionalRBrace
virtual ParseResult parseOptionalRBrace()=0
Parse a } token if present.

mlir::AsmParser::parseCommaSeparatedList
virtual ParseResult parseCommaSeparatedList(Delimiter delimiter, function_ref< ParseResult()> parseElementFn, StringRef contextMessage=StringRef())=0
Parse a list of comma-separated items with an optional delimiter.

mlir::AsmParser::getBuilder
virtual Builder & getBuilder() const =0
Return a builder which provides useful access to MLIRContext, global objects like types and attribute...

mlir::AsmParser::parseOptionalType
virtual OptionalParseResult parseOptionalType(Type &result)=0
Parse an optional type.

mlir::AsmParser::emitError
virtual InFlightDiagnostic emitError(SMLoc loc, const Twine &message={})=0
Emit a diagnostic at the specified location and return failure.

mlir::AsmParser::parseOptionalColon
virtual ParseResult parseOptionalColon()=0
Parse a : token if present.

mlir::AsmParser::parseInteger
ParseResult parseInteger(IntT &result)
Parse an integer value from the stream.
Definition: OpImplementation.h:752

mlir::AsmParser::parseRBrace
virtual ParseResult parseRBrace()=0
Parse a } token.

mlir::AsmParser::parseLess
virtual ParseResult parseLess()=0
Parse a '<' token.

mlir::AsmParser::getCurrentLocation
virtual SMLoc getCurrentLocation()=0
Get the location of the next token and store it into the argument.

mlir::AsmParser::getChecked
auto getChecked(SMLoc loc, ParamsT &&...params)
Invoke the getChecked method of the given Attribute or Type class, using the provided location to emi...
Definition: OpImplementation.h:971

mlir::AsmParser::parseColon
virtual ParseResult parseColon()=0
Parse a : token.

mlir::AsmParser::getNameLoc
virtual SMLoc getNameLoc() const =0
Return the location of the original name token.

mlir::AsmParser::parseOptionalLess
virtual ParseResult parseOptionalLess()=0
Parse a '<' token if present.

mlir::AsmParser::parseGreater
virtual ParseResult parseGreater()=0
Parse a '>' token.

mlir::AsmParser::parseType
virtual ParseResult parseType(Type &result)=0
Parse a type.

mlir::AsmParser::parseComma
virtual ParseResult parseComma()=0
Parse a , token.

mlir::AsmParser::parseFloat
virtual ParseResult parseFloat(double &result)=0
Parse a floating point value from the stream.

mlir::AsmParser::parseKeyword
ParseResult parseKeyword(StringRef keyword)
Parse a given keyword.
Definition: OpImplementation.h:926

mlir::AsmParser::parseOptionalLBrace
virtual ParseResult parseOptionalLBrace()=0
Parse a { token if present.

mlir::Builder::getIntegerType
IntegerType getIntegerType(unsigned width)
Definition: Builders.cpp:66

mlir::DenseElementsAttr::getValues
auto getValues() const
Return the held element values as a range of the given type.
Definition: BuiltinAttributes.h:421

mlir::DenseElementsAttr::get
static DenseElementsAttr get(ShapedType type, ArrayRef< Attribute > values)
Constructs a dense elements attribute from an array of element values.
Definition: BuiltinAttributes.cpp:909

mlir::DenseElementsAttr::getType
ShapedType getType() const
Return the type of this ElementsAttr, guaranteed to be a vector or tensor with static shape.
Definition: BuiltinAttributes.cpp:1298

mlir::DialectAsmParser
The DialectAsmParser has methods for interacting with the asm parser when parsing attributes and type...
Definition: DialectImplementation.h:56

mlir::DialectAsmPrinter
This is a pure-virtual base class that exposes the asmprinter hooks necessary to implement a custom p...
Definition: DialectImplementation.h:44

mlir::InFlightDiagnostic
This class represents a diagnostic that is inflight and set to be reported.
Definition: Diagnostics.h:314

mlir::OptionalParseResult
This class implements Optional functionality for ParseResult.
Definition: OpDefinition.h:40

mlir::OptionalParseResult::has_value
bool has_value() const
Returns true if we contain a valid ParseResult value.
Definition: OpDefinition.h:50

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable component.
Definition: Types.h:74

mlir::quant::AnyQuantizedType
A quantized type that maps storage to/from expressed types in an unspecified way.
Definition: QuantTypes.h:201

mlir::quant::CalibratedQuantizedType
A quantized type that infers its range from given min/max values.
Definition: QuantTypes.h:522

mlir::quant::CalibratedQuantizedType::getMax
double getMax() const
Definition: QuantTypes.cpp:555

mlir::quant::CalibratedQuantizedType::getMin
double getMin() const
Definition: QuantTypes.cpp:553

mlir::quant::QuantizedType
Base class for all quantized types known to this dialect.
Definition: QuantTypes.h:50

mlir::quant::QuantizedType::MaxStorageBits
static constexpr unsigned MaxStorageBits
The maximum number of bits supported for storage types.
Definition: QuantTypes.h:56

mlir::quant::QuantizedType::hasStorageTypeBounds
bool hasStorageTypeBounds() const
Return whether the storage type has explicit min or max boundaries different from the minimum and maximum representable values.
Definition: QuantTypes.cpp:89

mlir::quant::QuantizedType::isSigned
bool isSigned() const
Whether the storage type should be interpreted as a signed quantity (true) or an unsigned value (false).
Definition: QuantTypes.h:103

mlir::quant::QuantizedType::getStorageTypeMax
int64_t getStorageTypeMax() const
The maximum value that storageType can take.
Definition: QuantTypes.cpp:85

mlir::quant::QuantizedType::getDefaultMaximumForInteger
static int64_t getDefaultMaximumForInteger(bool isSigned, unsigned integralWidth)
Gets the maximum possible value stored by a storageType.
Definition: QuantTypes.h:78

mlir::quant::QuantizedType::getStorageTypeIntegralWidth
unsigned getStorageTypeIntegralWidth() const
Gets the integral bit width that the underlying storage type can exactly represent.
Definition: QuantTypes.cpp:100

mlir::quant::QuantizedType::getStorageTypeMin
int64_t getStorageTypeMin() const
The minimum value that storageType can take.
Definition: QuantTypes.cpp:81

mlir::quant::QuantizedType::getDefaultMinimumForInteger
static int64_t getDefaultMinimumForInteger(bool isSigned, unsigned integralWidth)
Gets the minimum possible value stored by a storageType.
Definition: QuantTypes.h:68

mlir::quant::UniformQuantizedPerAxisType
Represents per-axis (also known as per-channel) quantization.
Definition: QuantTypes.h:322

mlir::quant::UniformQuantizedPerAxisType::getQuantizedDimension
int32_t getQuantizedDimension() const
Specifies the dimension of the Tensor's shape that the scales and zero_points correspond to.
Definition: QuantTypes.cpp:406

mlir::quant::UniformQuantizedPerAxisType::getZeroPoints
ArrayRef< int64_t > getZeroPoints() const
Gets the storage values corresponding to the real value 0 in the affine equation.
Definition: QuantTypes.cpp:402

mlir::quant::UniformQuantizedPerAxisType::getScales
ArrayRef< double > getScales() const
Gets the quantization scales.
Definition: QuantTypes.cpp:398

mlir::quant::UniformQuantizedSubChannelType
Represents sub-channel (also known as blockwise) quantization.
Definition: QuantTypes.h:407

mlir::quant::UniformQuantizedSubChannelType::getZeroPoints
DenseElementsAttr getZeroPoints() const
Gets the quantization zero-points.
Definition: QuantTypes.cpp:501

mlir::quant::UniformQuantizedSubChannelType::getBlockSizeInfo
const SmallVector< std::pair< int32_t, int64_t > > getBlockSizeInfo() const
Gets the block size information.
Definition: QuantTypes.cpp:515

mlir::quant::UniformQuantizedSubChannelType::getScales
DenseElementsAttr getScales() const
Gets the quantization scales.
Definition: QuantTypes.cpp:497

mlir::quant::UniformQuantizedType
Represents a family of uniform, quantized types.
Definition: QuantTypes.h:262

mlir::quant::UniformQuantizedType::getScale
double getScale() const
Gets the scale term.
Definition: QuantTypes.cpp:329

mlir::quant::UniformQuantizedType::getZeroPoint
int64_t getZeroPoint() const
Gets the storage value corresponding to the real value 0 in the affine equation.
Definition: QuantTypes.cpp:331

Quant.h

BuiltinTypes.h

mlir::LLVM::detail::printType
void printType(Type type, AsmPrinter &printer)
Prints an LLVM Dialect type.
Definition: LLVMTypeSyntax.cpp:97

mlir::quant::QuantizationFlags::Signed
@ Signed
Definition: QuantTypes.h:38

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::emitError
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
Definition: Diagnostics.cpp:328

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed; this helps unify some of the attribute construction code.
Definition: BytecodeImplementation.h:509

mlir::parseType
Type parseType(llvm::StringRef typeStr, MLIRContext *context, size_t *numRead=nullptr, bool isKnownNullTerminated=false)
This parses a single MLIR type to an MLIR context if it was valid.