doxygen/QuantTypes_8cpp_source.html

//===- QuantTypes.cpp - Quantization Types Implementation -------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#include "mlir/Dialect/Quant/IR/QuantTypes.h"

#include "TypeDetail.h"

#include "mlir/Dialect/Quant/IR/Quant.h"


#include "mlir/IR/BuiltinTypes.h"

#include "mlir/IR/MLIRContext.h"


using namespace mlir;

using namespace mlir::quant;

using namespace mlir::quant::detail;


namespace {


// Return the minimum scale representable in a given float type, i.e. the
// value produced by APFloat::getSmallest for that type's semantics, as a
// double. `expressedType` must be a FloatType (enforced by cast<>).
double getMinScale(Type expressedType) {
  const auto &semantics = cast<FloatType>(expressedType).getFloatSemantics();
  const APFloat smallest = APFloat::getSmallest(semantics);
  return smallest.convertToDouble();
}


// Return the maximum scale representable in a given float type, i.e. the
// value produced by APFloat::getLargest for that type's semantics, as a
// double. `expressedType` must be a FloatType (enforced by cast<>).
double getMaxScale(Type expressedType) {
  const auto &semantics = cast<FloatType>(expressedType).getFloatSemantics();
  const APFloat largest = APFloat::getLargest(semantics);
  return largest.convertToDouble();
}


} // namespace


/// Gets the flags associated with this type, as recorded in its storage.
unsigned QuantizedType::getFlags() const {
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->flags;
}


/// Support method to enable LLVM-style type casting: a type is treated as a
/// QuantizedType when the dialect it is registered to is the QuantDialect.
bool QuantizedType::classof(Type type) {
  auto &owningDialect = type.getDialect();
  return llvm::isa<QuantDialect>(owningDialect);
}


/// Verifies the invariants shared by every quantized type and reports the
/// first violation through `emitError`:
///   * `storageType` must be an IntegerType,
///   * its width must be in [1, MaxStorageBits],
///   * `storageTypeMin` must be strictly less than `storageTypeMax`, and both
///     must lie within the default range of an integer with the given
///     signedness (taken from `flags`) and width.
/// `expressedType` is not inspected here; derived types verify it.
/// Returns success() when all checks pass, otherwise the failure produced by
/// the emitted diagnostic.
LogicalResult
QuantizedType::verifyInvariants(function_ref<InFlightDiagnostic()> emitError,
                                unsigned flags, Type storageType,
                                Type expressedType, int64_t storageTypeMin,
                                int64_t storageTypeMax) {
  // Verify that the storage type is integral.
  // This restriction may be lifted at some point in favor of using bf16
  // or f16 as exact representations on hardware where that is advantageous.
  auto intStorageType = llvm::dyn_cast<IntegerType>(storageType);
  if (!intStorageType)
    return emitError() << "storage type must be integral";
  unsigned integralWidth = intStorageType.getWidth();

  // Verify storage width.
  if (integralWidth == 0 || integralWidth > MaxStorageBits)
    return emitError() << "illegal storage type size: " << integralWidth;

  // Verify storageTypeMin and storageTypeMax.
  bool isSigned =
      (flags & QuantizationFlags::Signed) == QuantizationFlags::Signed;
  int64_t defaultIntegerMin =
      getDefaultMinimumForInteger(isSigned, integralWidth);
  int64_t defaultIntegerMax =
      getDefaultMaximumForInteger(isSigned, integralWidth);
  // Compare the bounds directly instead of testing the sign of their
  // difference: `storageTypeMax - storageTypeMin` overflows int64_t (undefined
  // behavior) when the caller-supplied bounds are far apart.
  if (storageTypeMax <= storageTypeMin ||
      storageTypeMin < defaultIntegerMin ||
      storageTypeMax > defaultIntegerMax) {
    return emitError() << "illegal storage min and storage max: ("
                       << storageTypeMin << ":" << storageTypeMax << ")";
  }
  return success();
}


/// Gets the underlying type used to store values.
Type QuantizedType::getStorageType() const {
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->storageType;
}


/// The minimum value that storageType can take.
int64_t QuantizedType::getStorageTypeMin() const {
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->storageTypeMin;
}


/// The maximum value that storageType can take.
int64_t QuantizedType::getStorageTypeMax() const {
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->storageTypeMax;
}


/// Returns true when the stored min or max differs from the default min/max
/// of an integer with this type's signedness and storage width.
bool QuantizedType::hasStorageTypeBounds() const {
  const unsigned width = getStorageTypeIntegralWidth();
  const bool signedStorage = isSigned();

  const bool minIsDefault =
      getStorageTypeMin() == getDefaultMinimumForInteger(signedStorage, width);
  const bool maxIsDefault =
      getStorageTypeMax() == getDefaultMaximumForInteger(signedStorage, width);

  // Explicit bounds exist as soon as either end departs from its default.
  return !(minIsDefault && maxIsDefault);
}


/// Gets the bit width of the storage type, as reported by
/// getIntOrFloatBitWidth() on the stored type.
unsigned QuantizedType::getStorageTypeIntegralWidth() const {
  // NOTE: If ever supporting non-integral storage types, some other scheme
  // for determining the width will be needed.
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->storageType.getIntOrFloatBitWidth();
}


/// Gets the original expressed type that this quantized type approximates.
Type QuantizedType::getExpressedType() const {
  const auto *storage = static_cast<ImplType *>(impl);
  return storage->expressedType;
}


/// Returns whether `candidateExpressedType` is a match for this
/// QuantizedType: either it equals the expressed type, or it is a ShapedType
/// whose element type equals the expressed type.
bool QuantizedType::isCompatibleExpressedType(Type candidateExpressedType) {
  // For shaped candidates only the element type takes part in the comparison.
  Type typeToCompare = candidateExpressedType;
  if (auto shapedCandidate = llvm::dyn_cast<ShapedType>(candidateExpressedType))
    typeToCompare = shapedCandidate.getElementType();
  return typeToCompare == getExpressedType();
}


/// Returns the element type as a QuantizedType, or a null QuantizedType if it
/// is not a quantized type. For a ShapedType the element type is examined;
/// any other type is examined directly.
QuantizedType
QuantizedType::getQuantizedElementType(Type primitiveOrContainerType) {
  Type scalarType = primitiveOrContainerType;
  if (auto shapedType = llvm::dyn_cast<ShapedType>(primitiveOrContainerType))
    scalarType = shapedType.getElementType();
  return llvm::dyn_cast<QuantizedType>(scalarType);
}


/// Casts from a type based on the storageType to a corresponding type based
/// on this quantized type. Returns nullptr if the cast is not valid, i.e. if
/// `candidateType` is neither the storage type itself nor a ranked tensor,
/// unranked tensor or vector whose element type is the storage type.
///
/// The container branches previously rebuilt the container around
/// getStorageType() (handing back a storage-typed container rather than a
/// quantized one) and did not check the candidate's element type; both now
/// mirror castFromExpressedType.
Type QuantizedType::castFromStorageType(Type candidateType) {
  if (candidateType == getStorageType()) {
    // i.e. i8 -> quant<"uniform[i8:f32]{1.0}">
    return *this;
  }
  if (llvm::isa<ShapedType>(candidateType)) {
    ShapedType candidateShapedType = llvm::cast<ShapedType>(candidateType);
    // A container can only be reinterpreted when it actually holds values of
    // the storage type.
    if (candidateShapedType.getElementType() != getStorageType()) {
      return nullptr;
    }

    if (llvm::isa<RankedTensorType>(candidateType)) {
      // i.e. tensor<4xi8> -> tensor<4x!quant<"uniform[i8:f32]{1.0}">>
      return RankedTensorType::get(candidateShapedType.getShape(), *this);
    }
    if (llvm::isa<UnrankedTensorType>(candidateType)) {
      // i.e. tensor<*xi8> -> tensor<*x!quant<"uniform[i8:f32]{1.0}">>
      return UnrankedTensorType::get(*this);
    }
    if (llvm::isa<VectorType>(candidateType)) {
      // i.e. vector<4xi8> -> vector<4x!quant<"uniform[i8:f32]{1.0}">>
      return VectorType::get(candidateShapedType.getShape(), *this);
    }
  }

  return nullptr;
}


/// Casts from a type based on a QuantizedType to a corresponding type based
/// on its storage type. Returns nullptr when `quantizedType` is neither a
/// QuantizedType nor a ranked tensor, unranked tensor or vector of one.
Type QuantizedType::castToStorageType(Type quantizedType) {
  // Scalar case, i.e. quant<"uniform[i8:f32]{1.0}"> -> i8
  if (auto scalarQuantType = llvm::dyn_cast<QuantizedType>(quantizedType))
    return scalarQuantType.getStorageType();

  // Container case,
  // i.e. tensor<4x!quant<"uniform[i8:f32]{1.0}">> -> tensor<4xi8>
  auto shapedType = llvm::dyn_cast<ShapedType>(quantizedType);
  if (!shapedType)
    return nullptr;
  auto elementQuantType =
      llvm::dyn_cast<QuantizedType>(shapedType.getElementType());
  if (!elementQuantType)
    return nullptr;
  Type storageType = elementQuantType.getStorageType();

  if (llvm::isa<RankedTensorType>(quantizedType))
    return RankedTensorType::get(shapedType.getShape(), storageType);
  if (llvm::isa<UnrankedTensorType>(quantizedType))
    return UnrankedTensorType::get(storageType);
  if (llvm::isa<VectorType>(quantizedType))
    return VectorType::get(shapedType.getShape(), storageType);

  // Any other shaped container is not supported.
  return nullptr;
}


/// Casts from a type based on the expressedType to a corresponding type based
/// on this quantized type. Returns nullptr when `candidateType` is neither
/// the expressed type nor a ranked tensor, unranked tensor or vector whose
/// element type is the expressed type.
Type QuantizedType::castFromExpressedType(Type candidateType) {
  // Scalar case, i.e. f32 -> quant<"uniform[i8:f32]{1.0}">
  if (candidateType == getExpressedType())
    return *this;

  // Everything else must be a container of the expressed type.
  auto shapedCandidate = llvm::dyn_cast<ShapedType>(candidateType);
  if (!shapedCandidate)
    return nullptr;
  if (shapedCandidate.getElementType() != getExpressedType())
    return nullptr;

  // i.e. tensor<4xf32> -> tensor<4x!quant<"uniform[i8:f32]{1.0}">>
  if (llvm::isa<RankedTensorType>(candidateType))
    return RankedTensorType::get(shapedCandidate.getShape(), *this);

  // i.e. tensor<*xf32> -> tensor<*x!quant<"uniform[i8:f32]{1.0}">>
  if (llvm::isa<UnrankedTensorType>(candidateType))
    return UnrankedTensorType::get(*this);

  // i.e. vector<4xf32> -> vector<4x!quant<"uniform[i8:f32]{1.0}">>
  if (llvm::isa<VectorType>(candidateType))
    return VectorType::get(shapedCandidate.getShape(), *this);

  return nullptr;
}


/// Casts from a type based on QuantizedType to a corresponding type based on
/// its expressed type. Returns nullptr when `quantizedType` is neither a
/// QuantizedType nor a ranked tensor, unranked tensor or vector of one.
Type QuantizedType::castToExpressedType(Type quantizedType) {
  // Scalar case, i.e. quant<"uniform[i8:f32]{1.0}"> -> f32
  if (auto scalarQuantType = llvm::dyn_cast<QuantizedType>(quantizedType))
    return scalarQuantType.getExpressedType();

  // Container case,
  // i.e. tensor<4x!quant<"uniform[i8:f32]{1.0}">> -> tensor<4xf32>
  auto shapedType = llvm::dyn_cast<ShapedType>(quantizedType);
  if (!shapedType)
    return nullptr;
  auto elementQuantType =
      llvm::dyn_cast<QuantizedType>(shapedType.getElementType());
  if (!elementQuantType)
    return nullptr;
  Type expressedType = elementQuantType.getExpressedType();

  if (llvm::isa<RankedTensorType>(quantizedType))
    return RankedTensorType::get(shapedType.getShape(), expressedType);
  if (llvm::isa<UnrankedTensorType>(quantizedType))
    return UnrankedTensorType::get(expressedType);
  if (llvm::isa<VectorType>(quantizedType))
    return VectorType::get(shapedType.getShape(), expressedType);

  // Any other shaped container is not supported.
  return nullptr;
}


/// Casts from a type based on the expressedType to the equivalent type based
/// on storageType, going through this quantized type. Returns nullptr when
/// the expressed-to-quantized step fails.
Type QuantizedType::castExpressedToStorageType(Type candidateType) {
  if (Type quantizedForm = castFromExpressedType(candidateType))
    return QuantizedType::castToStorageType(quantizedForm);
  return nullptr;
}


/// Gets an instance of the type with all parameters specified but not
/// checked. The instance is created in the context of `storageType`.
AnyQuantizedType AnyQuantizedType::get(unsigned flags, Type storageType,
                                       Type expressedType,
                                       int64_t storageTypeMin,
                                       int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::get(context, flags, storageType, expressedType, storageTypeMin,
                   storageTypeMax);
}


/// Gets an instance of the type with all specified parameters checked;
/// diagnostics are reported through `emitError`. The instance is created in
/// the context of `storageType`.
AnyQuantizedType
AnyQuantizedType::getChecked(function_ref<InFlightDiagnostic()> emitError,
                             unsigned flags, Type storageType,
                             Type expressedType, int64_t storageTypeMin,
                             int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::getChecked(emitError, context, flags, storageType,
                          expressedType, storageTypeMin, storageTypeMax);
}


/// Verifies construction invariants and issues errors through `emitError`.
/// Runs the common QuantizedType checks first, then requires that the
/// expressed type, when one is given, is a floating point type.
LogicalResult
AnyQuantizedType::verifyInvariants(function_ref<InFlightDiagnostic()> emitError,
                                   unsigned flags, Type storageType,
                                   Type expressedType, int64_t storageTypeMin,
                                   int64_t storageTypeMax) {
  LogicalResult baseResult = QuantizedType::verifyInvariants(
      emitError, flags, storageType, expressedType, storageTypeMin,
      storageTypeMax);
  if (failed(baseResult))
    return failure();

  // The expressed type is optional here, but if present it must be floating
  // point. If this restriction is ever eliminated, the parser/printer must be
  // extended.
  const bool expressedTypeIsAcceptable =
      !expressedType || llvm::isa<FloatType>(expressedType);
  if (!expressedTypeIsAcceptable)
    return emitError() << "expressed type must be floating point";

  return success();
}


/// Gets an instance of the type with all parameters specified but not
/// checked. The instance is created in the context of `storageType`.
UniformQuantizedType UniformQuantizedType::get(unsigned flags, Type storageType,
                                               Type expressedType, double scale,
                                               int64_t zeroPoint,
                                               int64_t storageTypeMin,
                                               int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::get(context, flags, storageType, expressedType, scale,
                   zeroPoint, storageTypeMin, storageTypeMax);
}


/// Gets an instance of the type with all specified parameters checked;
/// diagnostics are reported through `emitError`. The instance is created in
/// the context of `storageType`.
UniformQuantizedType UniformQuantizedType::getChecked(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, double scale, int64_t zeroPoint,
    int64_t storageTypeMin, int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::getChecked(emitError, context, flags, storageType,
                          expressedType, scale, zeroPoint, storageTypeMin,
                          storageTypeMax);
}


/// Verifies construction invariants and issues errors through `emitError`.
/// On top of the common QuantizedType checks this requires:
///   * a non-null expressed type,
///   * that the expressed type is floating point, and
///   * that `scale` lies within [getMinScale, getMaxScale] of the expressed
///     type. A NaN scale is rejected as out of range.
/// Returns success() when every check passes.
LogicalResult UniformQuantizedType::verifyInvariants(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, double scale, int64_t zeroPoint,
    int64_t storageTypeMin, int64_t storageTypeMax) {
  if (failed(QuantizedType::verifyInvariants(emitError, flags, storageType,
                                             expressedType, storageTypeMin,
                                             storageTypeMax))) {
    return failure();
  }

  // Uniform quantization requires fully expressed parameters, including
  // expressed type.
  if (!expressedType)
    return emitError() << "uniform quantization requires expressed type";

  // Verify that the expressed type is floating point.
  // If this restriction is ever eliminated, the parser/printer must be
  // extended.
  if (!llvm::isa<FloatType>(expressedType))
    return emitError() << "expressed type must be floating point";

  // Verify scale.
  double minScale = getMinScale(expressedType);
  double maxScale = getMaxScale(expressedType);
  // Written as a negated in-range test: every ordered comparison with NaN is
  // false, so `scale < minScale || scale > maxScale` would let a NaN scale
  // through.
  if (!(scale >= minScale && scale <= maxScale))
    return emitError() << "scale out of expressed type range [" << minScale
                       << ", " << maxScale << "]";

  return success();
}


/// Gets the scale stored in this type.
double UniformQuantizedType::getScale() const {
  const auto *storage = getImpl();
  return storage->scale;
}


/// Gets the zero point stored in this type.
int64_t UniformQuantizedType::getZeroPoint() const {
  const auto *storage = getImpl();
  return storage->zeroPoint;
}


/// Gets an instance of the type with all parameters specified but not
/// checked. The instance is created in the context of `storageType`.
UniformQuantizedPerAxisType UniformQuantizedPerAxisType::get(
    unsigned flags, Type storageType, Type expressedType,
    ArrayRef<double> scales, ArrayRef<int64_t> zeroPoints,
    int32_t quantizedDimension, int64_t storageTypeMin,
    int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::get(context, flags, storageType, expressedType, scales,
                   zeroPoints, quantizedDimension, storageTypeMin,
                   storageTypeMax);
}


/// Gets an instance of the type with all specified parameters checked;
/// diagnostics are reported through `emitError`. The instance is created in
/// the context of `storageType`.
UniformQuantizedPerAxisType UniformQuantizedPerAxisType::getChecked(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, ArrayRef<double> scales,
    ArrayRef<int64_t> zeroPoints, int32_t quantizedDimension,
    int64_t storageTypeMin, int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::getChecked(emitError, context, flags, storageType,
                          expressedType, scales, zeroPoints,
                          quantizedDimension, storageTypeMin, storageTypeMax);
}


/// Verifies construction invariants and issues errors through `emitError`.
/// On top of the common QuantizedType checks this requires:
///   * a non-null, floating point expressed type,
///   * the same number of scales and zero points,
///   * every scale within [getMinScale, getMaxScale] of the expressed type
///     (a NaN scale is rejected as out of range), and
///   * a non-negative quantized dimension.
/// Returns success() when every check passes.
LogicalResult UniformQuantizedPerAxisType::verifyInvariants(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, ArrayRef<double> scales,
    ArrayRef<int64_t> zeroPoints, int32_t quantizedDimension,
    int64_t storageTypeMin, int64_t storageTypeMax) {
  if (failed(QuantizedType::verifyInvariants(emitError, flags, storageType,
                                             expressedType, storageTypeMin,
                                             storageTypeMax))) {
    return failure();
  }

  // Uniform quantization requires fully expressed parameters, including
  // expressed type.
  if (!expressedType)
    return emitError() << "uniform quantization requires expressed type";

  // Verify that the expressed type is floating point.
  // If this restriction is ever eliminated, the parser/printer must be
  // extended.
  if (!llvm::isa<FloatType>(expressedType))
    return emitError() << "expressed type must be floating point";

  // Ensure that the number of scales and zeroPoints match.
  if (scales.size() != zeroPoints.size())
    return emitError() << "illegal number of scales and zeroPoints: "
                       << scales.size() << ", " << zeroPoints.size();

  // Verify scale.
  double minScale = getMinScale(expressedType);
  double maxScale = getMaxScale(expressedType);
  for (double scale : scales) {
    // Written as a negated in-range test: every ordered comparison with NaN
    // is false, so `scale < minScale || scale > maxScale` would let a NaN
    // scale through.
    if (!(scale >= minScale && scale <= maxScale))
      return emitError() << "scale out of expressed type range [" << minScale
                         << ", " << maxScale << "]";
  }

  // Verify quantized dimension.
  if (quantizedDimension < 0)
    return emitError() << "illegal quantized dimension: " << quantizedDimension;

  return success();
}


/// Gets the quantization scales held by this type's storage.
ArrayRef<double> UniformQuantizedPerAxisType::getScales() const {
  auto *storage = getImpl();
  return storage->getScales();
}


/// Gets the zero points held by this type's storage.
ArrayRef<int64_t> UniformQuantizedPerAxisType::getZeroPoints() const {
  auto *storage = getImpl();
  return storage->getZeroPoints();
}


/// Gets the quantized dimension stored in this type.
int32_t UniformQuantizedPerAxisType::getQuantizedDimension() const {
  const auto *storage = getImpl();
  return storage->quantizedDimension;
}


/// Gets an instance of the type with all parameters specified; the
/// arguments are forwarded unchanged to Base::get. The instance is created
/// in the context of `storageType`.
UniformQuantizedSubChannelType UniformQuantizedSubChannelType::get(
    unsigned flags, Type storageType, Type expressedType,
    DenseElementsAttr scales, DenseElementsAttr zeroPoints,
    ArrayRef<int32_t> quantizedDimensions, ArrayRef<int64_t> blockSizes,
    int64_t storageTypeMin, int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::get(context, flags, storageType, expressedType, scales,
                   zeroPoints, quantizedDimensions, blockSizes, storageTypeMin,
                   storageTypeMax);
}


/// Gets an instance of the type through Base::getChecked, reporting
/// diagnostics through `emitError`. The instance is created in the context
/// of `storageType`.
UniformQuantizedSubChannelType UniformQuantizedSubChannelType::getChecked(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, DenseElementsAttr scales,
    DenseElementsAttr zeroPoints, ArrayRef<int32_t> quantizedDimensions,
    ArrayRef<int64_t> blockSizes, int64_t storageTypeMin,
    int64_t storageTypeMax) {
  auto *context = storageType.getContext();
  return Base::getChecked(emitError, context, flags, storageType,
                          expressedType, scales, zeroPoints,
                          quantizedDimensions, blockSizes, storageTypeMin,
                          storageTypeMax);
}


/// Verifies construction invariants and issues errors through `emitError`.
/// On top of the common QuantizedType checks this requires:
///   * a non-null, floating point expressed type,
///   * the element type of `scales` to equal the expressed type,
///   * the element type of `zeroPoints` to equal the storage type,
///   * `scales` and `zeroPoints` to have the same shape,
///   * as many block sizes as quantized dimensions,
///   * every quantized dimension to be non-negative, and
///   * every block size to be strictly positive.
/// Returns success() when every check passes.
LogicalResult UniformQuantizedSubChannelType::verifyInvariants(
    function_ref<InFlightDiagnostic()> emitError, unsigned flags,
    Type storageType, Type expressedType, DenseElementsAttr scales,
    DenseElementsAttr zeroPoints, ArrayRef<int32_t> quantizedDimensions,
    ArrayRef<int64_t> blockSizes, int64_t storageTypeMin,
    int64_t storageTypeMax) {
  if (failed(QuantizedType::verifyInvariants(emitError, flags, storageType,
                                             expressedType, storageTypeMin,
                                             storageTypeMax))) {
    return failure();
  }

  // Uniform quantization requires fully expressed parameters, including
  // expressed type.
  if (!expressedType)
    return emitError() << "uniform quantization requires expressed type";

  // Verify that the expressed type is floating point.
  // If this restriction is ever eliminated, the parser/printer must be
  // extended.
  if (!llvm::isa<FloatType>(expressedType))
    return emitError() << "expressed type must be floating point";

  // Verify scale type to match expressedType.
  if (scales.getType().getElementType() != expressedType) {
    return emitError() << "type of scale values "
                       << scales.getType().getElementType()
                       << " must match the expressed type " << expressedType;
  }

  // Verify zero-point type to match storageType.
  if (zeroPoints.getType().getElementType() != storageType) {
    return emitError() << "type of zero point values "
                       << zeroPoints.getType().getElementType()
                       << " must match the storage type " << storageType;
  }

  // Ensure that the shape of scales and zeroPoints match.
  if (scales.getType().getShape() != zeroPoints.getType().getShape())
    return emitError() << "shape of scales and zeroPoints ("
                       << scales.getType().getShape() << " vs "
                       << zeroPoints.getType().getShape() << ") does not match";

  // Ensure that the number of quantized-dimensions and block-sizes match.
  // The diagnostic reports the two counts that were actually compared (it
  // used to print the element counts of scales and zeroPoints instead).
  if (quantizedDimensions.size() != blockSizes.size())
    return emitError() << "number of quantized dimensions and block sizes ("
                       << quantizedDimensions.size() << " vs "
                       << blockSizes.size() << ") does not match";

  // Verify quantized dimension.
  for (auto quantizedDimension : quantizedDimensions) {
    if (quantizedDimension < 0)
      return emitError() << "illegal quantized dimension: "
                         << quantizedDimension;
  }

  // Verify block sizes.
  for (auto blockSize : blockSizes) {
    if (blockSize <= 0)
      return emitError() << "illegal block size: " << blockSize;
  }

  return success();
}


/// Gets the quantization scales held by this type's storage.
DenseElementsAttr UniformQuantizedSubChannelType::getScales() const {
  auto *storage = getImpl();
  return storage->getScales();
}


/// Gets the quantization zero-points held by this type's storage.
DenseElementsAttr UniformQuantizedSubChannelType::getZeroPoints() const {
  auto *storage = getImpl();
  return storage->getZeroPoints();
}


/// Gets the quantized dimensions held by this type's storage.
ArrayRef<int32_t>
UniformQuantizedSubChannelType::getQuantizedDimensions() const {
  auto *storage = getImpl();
  return storage->getQuantizedDimensions();
}


/// Gets the block sizes for the quantized dimensions.
ArrayRef<int64_t> UniformQuantizedSubChannelType::getBlockSizes() const {
  auto *storage = getImpl();
  return storage->getBlockSizes();
}


/// Builds a list of (quantized dimension, block size) pairs by walking
/// getQuantizedDimensions() and getBlockSizes() in lockstep.
const SmallVector<std::pair<int32_t, int64_t>>
UniformQuantizedSubChannelType::getBlockSizeInfo() const {
  const auto dims = getQuantizedDimensions();
  const auto sizes = getBlockSizes();

  SmallVector<std::pair<int32_t, int64_t>> pairs;
  pairs.reserve(dims.size());
  for (auto [dim, size] : llvm::zip(dims, sizes))
    pairs.push_back({dim, size});

  return pairs;
}


/// Gets an instance of the type with all parameters specified but not
/// checked. The instance is created in the context of `expressedType`.
CalibratedQuantizedType CalibratedQuantizedType::get(Type expressedType,
                                                     double min, double max) {
  auto *context = expressedType.getContext();
  return Base::get(context, expressedType, min, max);
}


/// Gets an instance of the type with all specified parameters checked;
/// diagnostics are reported through `emitError`. The instance is created in
/// the context of `expressedType`.
CalibratedQuantizedType CalibratedQuantizedType::getChecked(
    function_ref<InFlightDiagnostic()> emitError, Type expressedType,
    double min, double max) {
  auto *context = expressedType.getContext();
  return Base::getChecked(emitError, context, expressedType, min, max);
}


/// Verifies construction invariants and issues errors through `emitError`:
/// the expressed type must be floating point and `min` must be strictly
/// below `max`.
LogicalResult CalibratedQuantizedType::verifyInvariants(
    function_ref<InFlightDiagnostic()> emitError, Type expressedType,
    double min, double max) {
  // Only floating point expressed types are accepted. If this restriction is
  // ever eliminated, the parser/printer must be extended.
  const bool expressedIsFloat = llvm::isa<FloatType>(expressedType);
  if (!expressedIsFloat)
    return emitError() << "expressed type must be floating point";

  // An empty or inverted calibration range is rejected.
  if (min >= max)
    return emitError() << "illegal min and max: (" << min << ":" << max << ")";

  return success();
}


/// Gets the calibrated minimum stored in this type.
double CalibratedQuantizedType::getMin() const {
  const auto *storage = getImpl();
  return storage->min;
}


/// Gets the calibrated maximum stored in this type.
double CalibratedQuantizedType::getMax() const {
  const auto *storage = getImpl();
  return storage->max;
}

success
return success()

TypeDetail.h

result
result
Definition LinalgTransformOps.cpp:2097

MLIRContext.h

max
static Value max(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition PolynomialApproximation.cpp:212

min
static Value min(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition PolynomialApproximation.cpp:204

QuantTypes.h

getShape
static ArrayRef< int64_t > getShape(Type type)
Returns the shape of the given type.
Definition Traits.cpp:117

int64_t

llvm::ArrayRef
Definition LLVM.h:48

llvm::SmallVector
Definition LLVM.h:72

mlir::DenseElementsAttr
An attribute that represents a reference to a dense vector or tensor object.
Definition BuiltinAttributes.h:82

mlir::DenseElementsAttr::size
int64_t size() const
Returns the number of elements held by this attribute.
Definition BuiltinAttributes.h:608

mlir::DenseElementsAttr::getType
ShapedType getType() const
Return the type of this ElementsAttr, guaranteed to be a vector or tensor with static shape.
Definition BuiltinAttributes.cpp:1293

mlir::InFlightDiagnostic
This class represents a diagnostic that is inflight and set to be reported.
Definition Diagnostics.h:316

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition Types.h:74

mlir::Type::getDialect
Dialect & getDialect() const
Get the dialect this type is registered to.
Definition Types.h:107

mlir::Type::getContext
MLIRContext * getContext() const
Return the MLIRContext in which this type was uniqued.
Definition Types.cpp:35

mlir::Type::isSignedInteger
bool isSignedInteger() const
Return true if this is a signed integer type (with the specified width).
Definition Types.cpp:76

mlir::detail::StorageUserBase< ConcreteType, BaseType, StorageType, detail::TypeUniquer, Traits... >::get
static ConcreteType get(MLIRContext *ctx, Args &&...args)
Definition StorageUniquerSupport.h:177

mlir::detail::StorageUserBase< ConcreteType, BaseType, StorageType, detail::TypeUniquer, Traits... >::getChecked
static ConcreteType getChecked(const Location &loc, Args &&...args)
Definition StorageUniquerSupport.h:189

mlir::detail::StorageUserBase< ConcreteType, BaseType, StorageType, detail::TypeUniquer, Traits... >::getImpl
ImplType * getImpl() const
Definition StorageUniquerSupport.h:212

mlir::quant::AnyQuantizedType
A quantized type that maps storage to/from expressed types in an unspecified way.
Definition QuantTypes.h:203

mlir::quant::AnyQuantizedType::get
static AnyQuantizedType get(unsigned flags, Type storageType, Type expressedType, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all parameters specified but not checked.
Definition QuantTypes.cpp:242

mlir::quant::AnyQuantizedType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, int64_t storageTypeMin, int64_t storageTypeMax)
Verifies construction invariants and issues errors/warnings.
Definition QuantTypes.cpp:261

mlir::quant::AnyQuantizedType::getChecked
static AnyQuantizedType getChecked(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all specified parameters checked.
Definition QuantTypes.cpp:251

mlir::quant::CalibratedQuantizedType
A quantized type that infers its range from given min/max values.
Definition QuantTypes.h:524

mlir::quant::CalibratedQuantizedType::getMax
double getMax() const
Definition QuantTypes.cpp:555

mlir::quant::CalibratedQuantizedType::getMin
double getMin() const
Definition QuantTypes.cpp:553

mlir::quant::CalibratedQuantizedType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, Type expressedType, double min, double max)
Verifies construction invariants and issues errors/warnings.
Definition QuantTypes.cpp:539

mlir::quant::CalibratedQuantizedType::get
static CalibratedQuantizedType get(Type expressedType, double min, double max)
Gets an instance of the type with all parameters specified but not checked.
Definition QuantTypes.cpp:527

mlir::quant::CalibratedQuantizedType::getChecked
static CalibratedQuantizedType getChecked(function_ref< InFlightDiagnostic()> emitError, Type expressedType, double min, double max)
Gets an instance of the type with all specified parameters checked.
Definition QuantTypes.cpp:532

mlir::quant::QuantizedType
Base class for all quantized types known to this dialect.
Definition QuantTypes.h:50

mlir::quant::QuantizedType::getExpressedType
Type getExpressedType() const
Gets the original expressed type that this quantized type approximates.
Definition QuantTypes.cpp:106

mlir::quant::QuantizedType::MaxStorageBits
static constexpr unsigned MaxStorageBits
The maximum number of bits supported for storage types.
Definition QuantTypes.h:56

mlir::quant::QuantizedType::hasStorageTypeBounds
bool hasStorageTypeBounds() const
Return whether the storage type has explicit min or max boundaries different from the minimum and max...
Definition QuantTypes.cpp:89

mlir::quant::QuantizedType::castToStorageType
static Type castToStorageType(Type quantizedType)
Casts from a type based on a QuantizedType to a corresponding type based on the storageType (returns ...
Definition QuantTypes.cpp:152

mlir::quant::QuantizedType::castExpressedToStorageType
Type castExpressedToStorageType(Type candidateType)
Casts from a type based on the expressedType to the equivalent type based on storageType by way of th...
Definition QuantTypes.cpp:234

mlir::quant::QuantizedType::ImplType
detail::QuantizedTypeStorage ImplType
Definition QuantTypes.h:52

mlir::quant::QuantizedType::castToExpressedType
static Type castToExpressedType(Type quantizedType)
Casts from a type based on QuantizedType to a corresponding type based on the expressedType (returns ...
Definition QuantTypes.cpp:207

mlir::quant::QuantizedType::isSigned
bool isSigned() const
Whether the storage type should be interpreted as a signed quantity (true) or an unsigned value (fals...
Definition QuantTypes.h:103

mlir::quant::QuantizedType::Type
constexpr Type()=default

mlir::quant::QuantizedType::getQuantizedElementType
static QuantizedType getQuantizedElementType(Type primitiveOrContainerType)
Returns the element type as a QuantizedType or nullptr if it is not a quantized type.
Definition QuantTypes.cpp:119

mlir::quant::QuantizedType::getFlags
unsigned getFlags() const
Gets the flags associated with this type.
Definition QuantTypes.cpp:36

mlir::quant::QuantizedType::getStorageTypeMax
int64_t getStorageTypeMax() const
The maximum value that storageType can take.
Definition QuantTypes.cpp:85

mlir::quant::QuantizedType::getDefaultMaximumForInteger
static int64_t getDefaultMaximumForInteger(bool isSigned, unsigned integralWidth)
Gets the maximum possible value stored by a storageType.
Definition QuantTypes.h:78

mlir::quant::QuantizedType::getStorageTypeIntegralWidth
unsigned getStorageTypeIntegralWidth() const
Gets the integral bit width that the underlying storage type can exactly represent.
Definition QuantTypes.cpp:100

mlir::quant::QuantizedType::classof
static bool classof(Type type)
Support method to enable LLVM-style type casting.
Definition QuantTypes.cpp:40

mlir::quant::QuantizedType::castFromStorageType
Type castFromStorageType(Type candidateType)
Casts from a type based on the storageType to a corresponding type based on this type (returns nullpt...
Definition QuantTypes.cpp:128

mlir::quant::QuantizedType::getStorageTypeMin
int64_t getStorageTypeMin() const
The minimum value that storageType can take.
Definition QuantTypes.cpp:81

mlir::quant::QuantizedType::getDefaultMinimumForInteger
static int64_t getDefaultMinimumForInteger(bool isSigned, unsigned integralWidth)
Gets the minimum possible value stored by a storageType.
Definition QuantTypes.h:68

mlir::quant::QuantizedType::getStorageType
Type getStorageType() const
Gets the underlying type used to store values.
Definition QuantTypes.cpp:77

mlir::quant::QuantizedType::castFromExpressedType
Type castFromExpressedType(Type candidateType)
Casts from a type based on the expressedType to a corresponding type based on this type (returns null...
Definition QuantTypes.cpp:179

mlir::quant::QuantizedType::isCompatibleExpressedType
bool isCompatibleExpressedType(Type candidateExpressedType)
Returns whether the candidateExpressedType is a match for this QuantizedType.
Definition QuantTypes.cpp:110

mlir::quant::QuantizedType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, int64_t storageTypeMin, int64_t storageTypeMax)
Definition QuantTypes.cpp:45

mlir::quant::UniformQuantizedPerAxisType
Represents per-axis (also known as per-channel quantization).
Definition QuantTypes.h:324

mlir::quant::UniformQuantizedPerAxisType::getChecked
static UniformQuantizedPerAxisType getChecked(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, ArrayRef< double > scales, ArrayRef< int64_t > zeroPoints, int32_t quantizedDimension, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all specified parameters checked.
Definition QuantTypes.cpp:345

mlir::quant::UniformQuantizedPerAxisType::get
static UniformQuantizedPerAxisType get(unsigned flags, Type storageType, Type expressedType, ArrayRef< double > scales, ArrayRef< int64_t > zeroPoints, int32_t quantizedDimension, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all parameters specified but not checked.
Definition QuantTypes.cpp:335

mlir::quant::UniformQuantizedPerAxisType::getQuantizedDimension
int32_t getQuantizedDimension() const
Specifies the dimension of the Tensor's shape that the scales and zero_points correspond to.
Definition QuantTypes.cpp:406

mlir::quant::UniformQuantizedPerAxisType::getZeroPoints
ArrayRef< int64_t > getZeroPoints() const
Gets the storage values corresponding to the real value 0 in the affine equation.
Definition QuantTypes.cpp:402

mlir::quant::UniformQuantizedPerAxisType::getScales
ArrayRef< double > getScales() const
Gets the quantization scales.
Definition QuantTypes.cpp:398

mlir::quant::UniformQuantizedPerAxisType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, ArrayRef< double > scales, ArrayRef< int64_t > zeroPoints, int32_t quantizedDimension, int64_t storageTypeMin, int64_t storageTypeMax)
Verifies construction invariants and issues errors/warnings.
Definition QuantTypes.cpp:355

mlir::quant::UniformQuantizedSubChannelType
Represents sub-channel (also known as blockwise) quantization.
Definition QuantTypes.h:409

mlir::quant::UniformQuantizedSubChannelType::getQuantizedDimensions
ArrayRef< int32_t > getQuantizedDimensions() const
Gets the quantized dimensions.
Definition QuantTypes.cpp:506

mlir::quant::UniformQuantizedSubChannelType::getZeroPoints
DenseElementsAttr getZeroPoints() const
Gets the quantization zero-points.
Definition QuantTypes.cpp:501

mlir::quant::UniformQuantizedSubChannelType::getBlockSizes
ArrayRef< int64_t > getBlockSizes() const
Gets the block sizes for the quantized dimensions.
Definition QuantTypes.cpp:510

mlir::quant::UniformQuantizedSubChannelType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, DenseElementsAttr scales, DenseElementsAttr zeroPoints, ArrayRef< int32_t > quantizedDimensions, ArrayRef< int64_t > blockSizes, int64_t storageTypeMin, int64_t storageTypeMax)
Verifies construction invariants and issues errors/warnings.
Definition QuantTypes.cpp:432

mlir::quant::UniformQuantizedSubChannelType::getBlockSizeInfo
const SmallVector< std::pair< int32_t, int64_t > > getBlockSizeInfo() const
Gets the block size information.
Definition QuantTypes.cpp:515

mlir::quant::UniformQuantizedSubChannelType::getChecked
static UniformQuantizedSubChannelType getChecked(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, DenseElementsAttr scales, DenseElementsAttr zeroPoints, ArrayRef< int32_t > quantizedDimensions, ArrayRef< int64_t > blockSizes, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all specified parameters checked.
Definition QuantTypes.cpp:420

mlir::quant::UniformQuantizedSubChannelType::get
static UniformQuantizedSubChannelType get(unsigned flags, Type storageType, Type expressedType, DenseElementsAttr scales, DenseElementsAttr zeroPoints, ArrayRef< int32_t > quantizedDimensions, ArrayRef< int64_t > blockSizes, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all parameters specified but not checked.
Definition QuantTypes.cpp:410

mlir::quant::UniformQuantizedSubChannelType::getScales
DenseElementsAttr getScales() const
Gets the quantization scales.
Definition QuantTypes.cpp:497

mlir::quant::UniformQuantizedType
Represents a family of uniform, quantized types.
Definition QuantTypes.h:264

mlir::quant::UniformQuantizedType::getScale
double getScale() const
Gets the scale term.
Definition QuantTypes.cpp:329

mlir::quant::UniformQuantizedType::getZeroPoint
int64_t getZeroPoint() const
Gets the storage value corresponding to the real value 0 in the affine equation.
Definition QuantTypes.cpp:331

mlir::quant::UniformQuantizedType::verifyInvariants
static LogicalResult verifyInvariants(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, double scale, int64_t zeroPoint, int64_t storageTypeMin, int64_t storageTypeMax)
Verifies construction invariants and issues errors/warnings.
Definition QuantTypes.cpp:298

mlir::quant::UniformQuantizedType::getChecked
static UniformQuantizedType getChecked(function_ref< InFlightDiagnostic()> emitError, unsigned flags, Type storageType, Type expressedType, double scale, int64_t zeroPoint, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all specified parameters checked.
Definition QuantTypes.cpp:289

mlir::quant::UniformQuantizedType::get
static UniformQuantizedType get(unsigned flags, Type storageType, Type expressedType, double scale, int64_t zeroPoint, int64_t storageTypeMin, int64_t storageTypeMax)
Gets an instance of the type with all parameters specified but not checked.
Definition QuantTypes.cpp:280

Quant.h

BuiltinTypes.h

impl
Definition RunnerUtils.h:80

mlir::quant::QuantizationFlags::Signed
@ Signed
Definition QuantTypes.h:38

mlir::quant::detail
Definition QuantTypes.h:22

mlir::quant
Definition Quant.h:25

mlir
Include the generated interface declarations.
Definition AliasAnalysis.h:19

mlir::emitError
InFlightDiagnostic emitError(Location loc)
Utility method to emit an error message using this location.
Definition Diagnostics.cpp:332

mlir::function_ref
llvm::function_ref< Fn > function_ref
Definition LLVM.h:152