doxygen/DialectQuant_8cpp_source.html

 //===- DialectQuant.cpp - 'quant' dialect submodule -----------------------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include <cstdint>

 #include <vector>


 #include "mlir-c/BuiltinAttributes.h"

 #include "mlir-c/Dialect/Quant.h"

 #include "mlir-c/IR.h"

 #include "mlir/Bindings/Python/Nanobind.h"

 #include "mlir/Bindings/Python/NanobindAdaptors.h"


 namespace nb = nanobind;

 using namespace llvm;

 using namespace mlir;

 using namespace mlir::python::nanobind_adaptors;


 /// Registers the Python classes of the 'quant' dialect on module `m`.
 ///
 /// A `QuantizedType` base class is created first; `AnyQuantizedType`,
 /// `UniformQuantizedType`, `UniformQuantizedPerAxisType`,
 /// `UniformQuantizedSubChannelType` and `CalibratedQuantizedType` are then
 /// registered with `QuantizedType` as their Python superclass. Every binding
 /// forwards to the corresponding function of the MLIR C API.
 static void populateDialectQuantSubmodule(const nb::module_ &m) {
   //===-------------------------------------------------------------------===//
   // QuantizedType
   //===-------------------------------------------------------------------===//

   auto quantizedType =
       mlir_type_subclass(m, "QuantizedType", mlirTypeIsAQuantizedType);
   quantizedType.def_staticmethod(
       "default_minimum_for_integer",
       [](bool isSigned, unsigned integralWidth) {
         return mlirQuantizedTypeGetDefaultMinimumForInteger(isSigned,
                                                             integralWidth);
       },
       "Default minimum value for the integer with the specified signedness and "
       "bit width.",
       nb::arg("is_signed"), nb::arg("integral_width"));
   quantizedType.def_staticmethod(
       "default_maximum_for_integer",
       [](bool isSigned, unsigned integralWidth) {
         return mlirQuantizedTypeGetDefaultMaximumForInteger(isSigned,
                                                             integralWidth);
       },
       "Default maximum value for the integer with the specified signedness and "
       "bit width.",
       nb::arg("is_signed"), nb::arg("integral_width"));
   quantizedType.def_property_readonly(
       "expressed_type",
       [](MlirType type) { return mlirQuantizedTypeGetExpressedType(type); },
       "Type expressed by this quantized type.");
   quantizedType.def_property_readonly(
       "flags", [](MlirType type) { return mlirQuantizedTypeGetFlags(type); },
       "Flags of this quantized type (named accessors should be preferred to "
       "this)");
   quantizedType.def_property_readonly(
       "is_signed",
       [](MlirType type) { return mlirQuantizedTypeIsSigned(type); },
       "Signedness of this quantized type.");
   quantizedType.def_property_readonly(
       "storage_type",
       [](MlirType type) { return mlirQuantizedTypeGetStorageType(type); },
       "Storage type backing this quantized type.");
   quantizedType.def_property_readonly(
       "storage_type_min",
       [](MlirType type) { return mlirQuantizedTypeGetStorageTypeMin(type); },
       "The minimum value held by the storage type of this quantized type.");
   quantizedType.def_property_readonly(
       "storage_type_max",
       [](MlirType type) { return mlirQuantizedTypeGetStorageTypeMax(type); },
       "The maximum value held by the storage type of this quantized type.");
   quantizedType.def_property_readonly(
       "storage_type_integral_width",
       [](MlirType type) {
         return mlirQuantizedTypeGetStorageTypeIntegralWidth(type);
       },
       "The bitwidth of the storage type of this quantized type.");
   quantizedType.def(
       "is_compatible_expressed_type",
       [](MlirType type, MlirType candidate) {
         return mlirQuantizedTypeIsCompatibleExpressedType(type, candidate);
       },
       "Checks whether the candidate type can be expressed by this quantized "
       "type.",
       nb::arg("candidate"));
   quantizedType.def_property_readonly(
       "quantized_element_type",
       [](MlirType type) {
         return mlirQuantizedTypeGetQuantizedElementType(type);
       },
       "Element type of this quantized type expressed as quantized type.");

   // The cast helpers below all follow the same pattern: a null result from
   // the C API is turned into a Python TypeError.
   quantizedType.def(
       "cast_from_storage_type",
       [](MlirType type, MlirType candidate) {
         MlirType castResult =
             mlirQuantizedTypeCastFromStorageType(type, candidate);
         if (!mlirTypeIsNull(castResult))
           return castResult;
         throw nb::type_error("Invalid cast.");
       },
       "Casts from a type based on the storage type of this quantized type to a "
       "corresponding type based on the quantized type. Raises TypeError if the "
       "cast is not valid.",
       nb::arg("candidate"));
   quantizedType.def_staticmethod(
       "cast_to_storage_type",
       [](MlirType type) {
         MlirType castResult = mlirQuantizedTypeCastToStorageType(type);
         if (!mlirTypeIsNull(castResult))
           return castResult;
         throw nb::type_error("Invalid cast.");
       },
       "Casts from a type based on a quantized type to a corresponding type "
       "based on the storage type of this quantized type. Raises TypeError if "
       "the cast is not valid.",
       nb::arg("type"));
   quantizedType.def(
       "cast_from_expressed_type",
       [](MlirType type, MlirType candidate) {
         MlirType castResult =
             mlirQuantizedTypeCastFromExpressedType(type, candidate);
         if (!mlirTypeIsNull(castResult))
           return castResult;
         throw nb::type_error("Invalid cast.");
       },
       "Casts from a type based on the expressed type of this quantized type to "
       "a corresponding type based on the quantized type. Raises TypeError if "
       "the cast is not valid.",
       nb::arg("candidate"));
   quantizedType.def_staticmethod(
       "cast_to_expressed_type",
       [](MlirType type) {
         MlirType castResult = mlirQuantizedTypeCastToExpressedType(type);
         if (!mlirTypeIsNull(castResult))
           return castResult;
         throw nb::type_error("Invalid cast.");
       },
       "Casts from a type based on a quantized type to a corresponding type "
       "based on the expressed type of this quantized type. Raises TypeError if "
       "the cast is not valid.",
       nb::arg("type"));
   quantizedType.def(
       "cast_expressed_to_storage_type",
       [](MlirType type, MlirType candidate) {
         MlirType castResult =
             mlirQuantizedTypeCastExpressedToStorageType(type, candidate);
         if (!mlirTypeIsNull(castResult))
           return castResult;
         throw nb::type_error("Invalid cast.");
       },
       "Casts from a type based on the expressed type of this quantized type to "
       "a corresponding type based on the storage type. Raises TypeError if the "
       "cast is not valid.",
       nb::arg("candidate"));

   // Expose the signedness bit flag as a class-level attribute.
   quantizedType.get_class().attr("FLAG_SIGNED") =
       mlirQuantizedTypeGetSignedFlag();

   //===-------------------------------------------------------------------===//
   // AnyQuantizedType
   //===-------------------------------------------------------------------===//

   auto anyQuantizedType =
       mlir_type_subclass(m, "AnyQuantizedType", mlirTypeIsAAnyQuantizedType,
                          quantizedType.get_class());
   anyQuantizedType.def_classmethod(
       "get",
       [](nb::object cls, unsigned flags, MlirType storageType,
          MlirType expressedType, int64_t storageTypeMin,
          int64_t storageTypeMax) {
         return cls(mlirAnyQuantizedTypeGet(flags, storageType, expressedType,
                                            storageTypeMin, storageTypeMax));
       },
       "Gets an instance of AnyQuantizedType in the same context as the "
       "provided storage type.",
       nb::arg("cls"), nb::arg("flags"), nb::arg("storage_type"),
       nb::arg("expressed_type"), nb::arg("storage_type_min"),
       nb::arg("storage_type_max"));

   //===-------------------------------------------------------------------===//
   // UniformQuantizedType
   //===-------------------------------------------------------------------===//

   auto uniformQuantizedType = mlir_type_subclass(
       m, "UniformQuantizedType", mlirTypeIsAUniformQuantizedType,
       quantizedType.get_class());
   uniformQuantizedType.def_classmethod(
       "get",
       [](nb::object cls, unsigned flags, MlirType storageType,
          MlirType expressedType, double scale, int64_t zeroPoint,
          int64_t storageTypeMin, int64_t storageTypeMax) {
         return cls(mlirUniformQuantizedTypeGet(flags, storageType,
                                                expressedType, scale, zeroPoint,
                                                storageTypeMin, storageTypeMax));
       },
       "Gets an instance of UniformQuantizedType in the same context as the "
       "provided storage type.",
       nb::arg("cls"), nb::arg("flags"), nb::arg("storage_type"),
       nb::arg("expressed_type"), nb::arg("scale"), nb::arg("zero_point"),
       nb::arg("storage_type_min"), nb::arg("storage_type_max"));
   uniformQuantizedType.def_property_readonly(
       "scale",
       [](MlirType type) { return mlirUniformQuantizedTypeGetScale(type); },
       "The scale designates the difference between the real values "
       "corresponding to consecutive quantized values differing by 1.");
   uniformQuantizedType.def_property_readonly(
       "zero_point",
       [](MlirType type) { return mlirUniformQuantizedTypeGetZeroPoint(type); },
       "The storage value corresponding to the real value 0 in the affine "
       "equation.");
   uniformQuantizedType.def_property_readonly(
       "is_fixed_point",
       [](MlirType type) { return mlirUniformQuantizedTypeIsFixedPoint(type); },
       "Fixed point values are real numbers divided by a scale.");

   //===-------------------------------------------------------------------===//
   // UniformQuantizedPerAxisType
   //===-------------------------------------------------------------------===//

   auto uniformQuantizedPerAxisType = mlir_type_subclass(
       m, "UniformQuantizedPerAxisType", mlirTypeIsAUniformQuantizedPerAxisType,
       quantizedType.get_class());
   uniformQuantizedPerAxisType.def_classmethod(
       "get",
       [](nb::object cls, unsigned flags, MlirType storageType,
          MlirType expressedType, std::vector<double> scales,
          std::vector<int64_t> zeroPoints, int32_t quantizedDimension,
          int64_t storageTypeMin, int64_t storageTypeMax) {
         // The C API receives one length for both arrays, so they must agree.
         if (scales.size() != zeroPoints.size())
           throw nb::value_error(
               "Mismatching number of scales and zero points.");
         auto nDims = static_cast<intptr_t>(scales.size());
         return cls(mlirUniformQuantizedPerAxisTypeGet(
             flags, storageType, expressedType, nDims, scales.data(),
             zeroPoints.data(), quantizedDimension, storageTypeMin,
             storageTypeMax));
       },
       "Gets an instance of UniformQuantizedPerAxisType in the same context as "
       "the provided storage type.",
       nb::arg("cls"), nb::arg("flags"), nb::arg("storage_type"),
       nb::arg("expressed_type"), nb::arg("scales"), nb::arg("zero_points"),
       nb::arg("quantized_dimension"), nb::arg("storage_type_min"),
       nb::arg("storage_type_max"));
   uniformQuantizedPerAxisType.def_property_readonly(
       "scales",
       [](MlirType type) {
         intptr_t nDim = mlirUniformQuantizedPerAxisTypeGetNumDims(type);
         std::vector<double> scales;
         scales.reserve(nDim);
         for (intptr_t i = 0; i < nDim; ++i) {
           double scale = mlirUniformQuantizedPerAxisTypeGetScale(type, i);
           scales.push_back(scale);
         }
         return scales;
       },
       "The scales designate the difference between the real values "
       "corresponding to consecutive quantized values differing by 1. The ith "
       "scale corresponds to the ith slice in the quantized_dimension.");
   uniformQuantizedPerAxisType.def_property_readonly(
       "zero_points",
       [](MlirType type) {
         intptr_t nDim = mlirUniformQuantizedPerAxisTypeGetNumDims(type);
         std::vector<int64_t> zeroPoints;
         zeroPoints.reserve(nDim);
         for (intptr_t i = 0; i < nDim; ++i) {
           int64_t zeroPoint =
               mlirUniformQuantizedPerAxisTypeGetZeroPoint(type, i);
           zeroPoints.push_back(zeroPoint);
         }
         return zeroPoints;
       },
       "the storage values corresponding to the real value 0 in the affine "
       "equation. The ith zero point corresponds to the ith slice in the "
       "quantized_dimension.");
   uniformQuantizedPerAxisType.def_property_readonly(
       "quantized_dimension",
       [](MlirType type) {
         return mlirUniformQuantizedPerAxisTypeGetQuantizedDimension(type);
       },
       "Specifies the dimension of the shape that the scales and zero points "
       "correspond to.");
   uniformQuantizedPerAxisType.def_property_readonly(
       "is_fixed_point",
       [](MlirType type) {
         return mlirUniformQuantizedPerAxisTypeIsFixedPoint(type);
       },
       "Fixed point values are real numbers divided by a scale.");

   //===-------------------------------------------------------------------===//
   // UniformQuantizedSubChannelType
   //===-------------------------------------------------------------------===//

   auto uniformQuantizedSubChannelType = mlir_type_subclass(
       m, "UniformQuantizedSubChannelType",
       mlirTypeIsAUniformQuantizedSubChannelType, quantizedType.get_class());
   uniformQuantizedSubChannelType.def_classmethod(
       "get",
       [](nb::object cls, unsigned flags, MlirType storageType,
          MlirType expressedType, MlirAttribute scales, MlirAttribute zeroPoints,
          std::vector<int32_t> quantizedDimensions,
          std::vector<int64_t> blockSizes, int64_t storageTypeMin,
          int64_t storageTypeMax) {
         // A single length is handed to the C API for both the quantized
         // dimensions and the block sizes; reject mismatched lists up front
         // so that neither buffer is read past its end.
         if (quantizedDimensions.size() != blockSizes.size())
           throw nb::value_error(
               "Mismatching number of quantized dimensions and block sizes.");
         auto blockSizeInfoLength = static_cast<intptr_t>(blockSizes.size());
         return cls(mlirUniformQuantizedSubChannelTypeGet(
             flags, storageType, expressedType, scales, zeroPoints,
             blockSizeInfoLength, quantizedDimensions.data(),
             blockSizes.data(), storageTypeMin, storageTypeMax));
       },
       "Gets an instance of UniformQuantizedSubChannel in the same context as "
       "the provided storage type.",
       nb::arg("cls"), nb::arg("flags"), nb::arg("storage_type"),
       nb::arg("expressed_type"), nb::arg("scales"), nb::arg("zero_points"),
       nb::arg("quantized_dimensions"), nb::arg("block_sizes"),
       nb::arg("storage_type_min"), nb::arg("storage_type_max"));
   uniformQuantizedSubChannelType.def_property_readonly(
       "quantized_dimensions",
       [](MlirType type) {
         intptr_t nDim =
             mlirUniformQuantizedSubChannelTypeGetNumBlockSizes(type);
         std::vector<int32_t> quantizedDimensions;
         quantizedDimensions.reserve(nDim);
         for (intptr_t i = 0; i < nDim; ++i) {
           quantizedDimensions.push_back(
               mlirUniformQuantizedSubChannelTypeGetQuantizedDimension(type, i));
         }
         return quantizedDimensions;
       },
       "Gets the quantized dimensions. Each element in the returned list "
       "represents an axis of the quantized data tensor that has a specified "
       "block size. The order of elements corresponds to the order of block "
       "sizes returned by 'block_sizes' method. It means that the data tensor "
       "is quantized along the i-th dimension in the returned list using the "
       "i-th block size from block_sizes method.");
   uniformQuantizedSubChannelType.def_property_readonly(
       "block_sizes",
       [](MlirType type) {
         intptr_t nDim =
             mlirUniformQuantizedSubChannelTypeGetNumBlockSizes(type);
         std::vector<int64_t> blockSizes;
         blockSizes.reserve(nDim);
         for (intptr_t i = 0; i < nDim; ++i) {
           blockSizes.push_back(
               mlirUniformQuantizedSubChannelTypeGetBlockSize(type, i));
         }
         return blockSizes;
       },
       "Gets the block sizes for the quantized dimensions. The i-th element in "
       "the returned list corresponds to the block size for the i-th dimension "
       "in the list returned by quantized_dimensions method.");
   uniformQuantizedSubChannelType.def_property_readonly(
       "scales",
       [](MlirType type) -> MlirAttribute {
         return mlirUniformQuantizedSubChannelTypeGetScales(type);
       },
       "The scales of the quantized type.");
   uniformQuantizedSubChannelType.def_property_readonly(
       "zero_points",
       [](MlirType type) -> MlirAttribute {
         return mlirUniformQuantizedSubChannelTypeGetZeroPoints(type);
       },
       "The zero points of the quantized type.");

   //===-------------------------------------------------------------------===//
   // CalibratedQuantizedType
   //===-------------------------------------------------------------------===//

   auto calibratedQuantizedType = mlir_type_subclass(
       m, "CalibratedQuantizedType", mlirTypeIsACalibratedQuantizedType,
       quantizedType.get_class());
   calibratedQuantizedType.def_classmethod(
       "get",
       [](nb::object cls, MlirType expressedType, double min, double max) {
         return cls(mlirCalibratedQuantizedTypeGet(expressedType, min, max));
       },
       "Gets an instance of CalibratedQuantizedType in the same context as the "
       "provided expressed type.",
       nb::arg("cls"), nb::arg("expressed_type"), nb::arg("min"),
       nb::arg("max"));
   calibratedQuantizedType.def_property_readonly(
       "min",
       [](MlirType type) { return mlirCalibratedQuantizedTypeGetMin(type); },
       "The min value of this calibrated quantized type.");
   calibratedQuantizedType.def_property_readonly(
       "max",
       [](MlirType type) { return mlirCalibratedQuantizedTypeGetMax(type); },
       "The max value of this calibrated quantized type.");
 }


 // Entry point of the `_mlirDialectsQuant` extension module: sets the module
 // docstring and then registers all 'quant' dialect bindings on it.
 NB_MODULE(_mlirDialectsQuant, m) {

   m.doc() = "MLIR Quantization dialect";


   // All class registrations live in the file-local helper defined above.
   populateDialectQuantSubmodule(m);

 }

populateDialectQuantSubmodule
static void populateDialectQuantSubmodule(const nb::module_ &m)
Definition: DialectQuant.cpp:23

NB_MODULE
NB_MODULE(_mlirDialectsQuant, m)
Definition: DialectQuant.cpp:385

NanobindAdaptors.h

Nanobind.h

max
static Value max(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:212

min
static Value min(ImplicitLocOpBuilder &builder, Value value, Value bound)
Definition: PolynomialApproximation.cpp:204

mlir::python::nanobind_adaptors::mlir_type_subclass
Creates a custom subclass of mlir.ir.Type, implementing a casting constructor and type checking metho...
Definition: NanobindAdaptors.h:529

BuiltinAttributes.h

Quant.h

mlirUniformQuantizedPerAxisTypeGetNumDims
MLIR_CAPI_EXPORTED intptr_t mlirUniformQuantizedPerAxisTypeGetNumDims(MlirType type)
Returns the number of axes in the given quantized per-axis type.
Definition: Quant.cpp:172

mlirTypeIsACalibratedQuantizedType
MLIR_CAPI_EXPORTED bool mlirTypeIsACalibratedQuantizedType(MlirType type)
Returns true if the given type is a CalibratedQuantizedType.
Definition: Quant.cpp:257

mlirQuantizedTypeGetDefaultMaximumForInteger
MLIR_CAPI_EXPORTED int64_t mlirQuantizedTypeGetDefaultMaximumForInteger(bool isSigned, unsigned integralWidth)
Returns the maximum possible value stored by a quantized type.
Definition: Quant.cpp:37

mlirUniformQuantizedTypeIsFixedPoint
MLIR_CAPI_EXPORTED bool mlirUniformQuantizedTypeIsFixedPoint(MlirType type)
Returns true if the given uniform quantized type is fixed-point.
Definition: Quant.cpp:149

mlirUniformQuantizedSubChannelTypeGetZeroPoints
MLIR_CAPI_EXPORTED MlirAttribute mlirUniformQuantizedSubChannelTypeGetZeroPoints(MlirType type)
Returns the zero-points of the quantized type.
Definition: Quant.cpp:248

mlirQuantizedTypeGetStorageTypeMin
MLIR_CAPI_EXPORTED int64_t mlirQuantizedTypeGetStorageTypeMin(MlirType type)
Returns the minimum value that the storage type of the given quantized type can take.
Definition: Quant.cpp:59

mlirTypeIsAUniformQuantizedType
MLIR_CAPI_EXPORTED bool mlirTypeIsAUniformQuantizedType(MlirType type)
Returns true if the given type is a UniformQuantizedType.
Definition: Quant.cpp:128

mlirTypeIsAQuantizedType
MLIR_CAPI_EXPORTED bool mlirTypeIsAQuantizedType(MlirType type)
Returns true if the given type is a quantization dialect type.
Definition: Quant.cpp:23

mlirUniformQuantizedPerAxisTypeGetScale
MLIR_CAPI_EXPORTED double mlirUniformQuantizedPerAxisTypeGetScale(MlirType type, intptr_t pos)
Returns pos-th scale of the given quantized per-axis type.
Definition: Quant.cpp:178

mlirUniformQuantizedSubChannelTypeGetScales
MLIR_CAPI_EXPORTED MlirAttribute mlirUniformQuantizedSubChannelTypeGetScales(MlirType type)
Returns the scales of the quantized type.
Definition: Quant.cpp:243

mlirUniformQuantizedTypeGetZeroPoint
MLIR_CAPI_EXPORTED int64_t mlirUniformQuantizedTypeGetZeroPoint(MlirType type)
Returns the zero point of the given uniform quantized type.
Definition: Quant.cpp:145

mlirUniformQuantizedPerAxisTypeIsFixedPoint
MLIR_CAPI_EXPORTED bool mlirUniformQuantizedPerAxisTypeIsFixedPoint(MlirType type)
Returns true if the given uniform quantized per-axis type is fixed-point.
Definition: Quant.cpp:194

mlirUniformQuantizedSubChannelTypeGetBlockSize
MLIR_CAPI_EXPORTED int64_t mlirUniformQuantizedSubChannelTypeGetBlockSize(MlirType type, intptr_t pos)
Returns the block size at the given position.
Definition: Quant.cpp:237

mlirQuantizedTypeGetStorageTypeMax
MLIR_CAPI_EXPORTED int64_t mlirQuantizedTypeGetStorageTypeMax(MlirType type)
Returns the maximum value that the storage type of the given quantized type can take.
Definition: Quant.cpp:63

mlirCalibratedQuantizedTypeGetMax
MLIR_CAPI_EXPORTED double mlirCalibratedQuantizedTypeGetMax(MlirType type)
Returns the max value of the given calibrated quantized type.
Definition: Quant.cpp:271

mlirCalibratedQuantizedTypeGet
MLIR_CAPI_EXPORTED MlirType mlirCalibratedQuantizedTypeGet(MlirType expressedType, double min, double max)
Creates an instance of CalibratedQuantizedType with the given parameters in the same context as expre...
Definition: Quant.cpp:261

mlirQuantizedTypeIsSigned
MLIR_CAPI_EXPORTED bool mlirQuantizedTypeIsSigned(MlirType type)
Returns true if the given type is signed, false otherwise.
Definition: Quant.cpp:51

mlirUniformQuantizedSubChannelTypeGetNumBlockSizes
MLIR_CAPI_EXPORTED intptr_t mlirUniformQuantizedSubChannelTypeGetNumBlockSizes(MlirType type)
Returns the number of block sizes provided in type.
Definition: Quant.cpp:225

mlirUniformQuantizedPerAxisTypeGetZeroPoint
MLIR_CAPI_EXPORTED int64_t mlirUniformQuantizedPerAxisTypeGetZeroPoint(MlirType type, intptr_t pos)
Returns pos-th zero point of the given quantized per-axis type.
Definition: Quant.cpp:183

mlirUniformQuantizedPerAxisTypeGetQuantizedDimension
MLIR_CAPI_EXPORTED int32_t mlirUniformQuantizedPerAxisTypeGetQuantizedDimension(MlirType type)
Returns the index of the quantized dimension in the given quantized per-axis type.
Definition: Quant.cpp:189

mlirQuantizedTypeCastToExpressedType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeCastToExpressedType(MlirType type)
Casts from a type based on a quantized type to a corresponding type based on the expressed type.
Definition: Quant.cpp:98

mlirQuantizedTypeGetExpressedType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeGetExpressedType(MlirType type)
Gets the original type approximated by the given quantized type.
Definition: Quant.cpp:43

mlirQuantizedTypeGetStorageTypeIntegralWidth
MLIR_CAPI_EXPORTED unsigned mlirQuantizedTypeGetStorageTypeIntegralWidth(MlirType type)
Returns the integral bitwidth that the storage type of the given quantized type can represent exactly...
Definition: Quant.cpp:67

mlirAnyQuantizedTypeGet
MLIR_CAPI_EXPORTED MlirType mlirAnyQuantizedTypeGet(unsigned flags, MlirType storageType, MlirType expressedType, int64_t storageTypeMin, int64_t storageTypeMax)
Creates an instance of AnyQuantizedType with the given parameters in the same context as storageType ...
Definition: Quant.cpp:116

mlirQuantizedTypeCastToStorageType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeCastToStorageType(MlirType type)
Casts from a type based on a quantized type to a corresponding type based on the storage type.
Definition: Quant.cpp:87

mlirQuantizedTypeGetStorageType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeGetStorageType(MlirType type)
Returns the underlying type used to store the values.
Definition: Quant.cpp:55

mlirUniformQuantizedSubChannelTypeGetQuantizedDimension
MLIR_CAPI_EXPORTED int32_t mlirUniformQuantizedSubChannelTypeGetQuantizedDimension(MlirType type, intptr_t pos)
Returns the quantized dimension at the given position.
Definition: Quant.cpp:231

mlirQuantizedTypeCastFromExpressedType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeCastFromExpressedType(MlirType type, MlirType candidate)
Casts from a type based on the expressed type of the given type to a corresponding type based on the ...
Definition: Quant.cpp:92

mlirTypeIsAUniformQuantizedPerAxisType
MLIR_CAPI_EXPORTED bool mlirTypeIsAUniformQuantizedPerAxisType(MlirType type)
Returns true if the given type is a UniformQuantizedPerAxisType.
Definition: Quant.cpp:157

mlirQuantizedTypeGetQuantizedElementType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeGetQuantizedElementType(MlirType type)
Returns the element type of the given quantized type as another quantized type.
Definition: Quant.cpp:77

mlirTypeIsAAnyQuantizedType
MLIR_CAPI_EXPORTED bool mlirTypeIsAAnyQuantizedType(MlirType type)
Returns true if the given type is an AnyQuantizedType.
Definition: Quant.cpp:112

mlirQuantizedTypeCastExpressedToStorageType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeCastExpressedToStorageType(MlirType type, MlirType candidate)
Casts from a type based on the expressed type of the given quantized type to equivalent type based on...
Definition: Quant.cpp:102

mlirQuantizedTypeCastFromStorageType
MLIR_CAPI_EXPORTED MlirType mlirQuantizedTypeCastFromStorageType(MlirType type, MlirType candidate)
Casts from a type based on the storage type of the given type to a corresponding type based on the gi...
Definition: Quant.cpp:81

mlirQuantizedTypeGetSignedFlag
MLIR_CAPI_EXPORTED unsigned mlirQuantizedTypeGetSignedFlag(void)
Returns the bit flag used to indicate signedness of a quantized type.
Definition: Quant.cpp:27

mlirQuantizedTypeGetDefaultMinimumForInteger
MLIR_CAPI_EXPORTED int64_t mlirQuantizedTypeGetDefaultMinimumForInteger(bool isSigned, unsigned integralWidth)
Returns the minimum possible value stored by a quantized type.
Definition: Quant.cpp:31

mlirCalibratedQuantizedTypeGetMin
MLIR_CAPI_EXPORTED double mlirCalibratedQuantizedTypeGetMin(MlirType type)
Returns the min value of the given calibrated quantized type.
Definition: Quant.cpp:267

mlirQuantizedTypeGetFlags
MLIR_CAPI_EXPORTED unsigned mlirQuantizedTypeGetFlags(MlirType type)
Gets the flags associated with the given quantized type.
Definition: Quant.cpp:47

mlirUniformQuantizedPerAxisTypeGet
MLIR_CAPI_EXPORTED MlirType mlirUniformQuantizedPerAxisTypeGet(unsigned flags, MlirType storageType, MlirType expressedType, intptr_t nDims, double *scales, int64_t *zeroPoints, int32_t quantizedDimension, int64_t storageTypeMin, int64_t storageTypeMax)
Creates an instance of UniformQuantizedPerAxisType with the given parameters in the same context as s...
Definition: Quant.cpp:161

mlirUniformQuantizedSubChannelTypeGet
MLIR_CAPI_EXPORTED MlirType mlirUniformQuantizedSubChannelTypeGet(unsigned flags, MlirType storageType, MlirType expressedType, MlirAttribute scalesAttr, MlirAttribute zeroPointsAttr, intptr_t blockSizeInfoLength, int32_t *quantizedDimensions, int64_t *blockSizes, int64_t storageTypeMin, int64_t storageTypeMax)
Creates a UniformQuantizedSubChannelType with the given parameters.
Definition: Quant.cpp:206

mlirQuantizedTypeIsCompatibleExpressedType
MLIR_CAPI_EXPORTED bool mlirQuantizedTypeIsCompatibleExpressedType(MlirType type, MlirType candidate)
Returns true if the candidate type is compatible with the given quantized type.
Definition: Quant.cpp:71

mlirTypeIsAUniformQuantizedSubChannelType
MLIR_CAPI_EXPORTED bool mlirTypeIsAUniformQuantizedSubChannelType(MlirType type)
Returns true if the given type is a UniformQuantizedSubChannel.
Definition: Quant.cpp:202

mlirUniformQuantizedTypeGetScale
MLIR_CAPI_EXPORTED double mlirUniformQuantizedTypeGetScale(MlirType type)
Returns the scale of the given uniform quantized type.
Definition: Quant.cpp:141

mlirUniformQuantizedTypeGet
MLIR_CAPI_EXPORTED MlirType mlirUniformQuantizedTypeGet(unsigned flags, MlirType storageType, MlirType expressedType, double scale, int64_t zeroPoint, int64_t storageTypeMin, int64_t storageTypeMax)
Creates an instance of UniformQuantizedType with the given parameters in the same context as storageT...
Definition: Quant.cpp:132

IR.h

mlirTypeIsNull
static bool mlirTypeIsNull(MlirType type)
Checks whether a type is null.
Definition: IR.h:1135

llvm
The OpAsmOpInterface, see OpAsmInterface.td for more details.
Definition: CallGraph.h:229

mlir::python::nanobind_adaptors
Definition: NanobindAdaptors.h:360

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

nanobind
Definition: NanobindAdaptors.h:35