doxygen/UniformSupport_8cpp_source.html

 //===- UniformSupport.cpp - Support utilities for uniform quant -----------===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//


 #include "mlir/Dialect/Quant/Utils/UniformSupport.h"

 #include "mlir/IR/BuiltinTypes.h"

 #include <numeric>


 using namespace mlir;

 using namespace mlir::quant;


 /// Returns true if `inputType` is a primitive type this file can quantize.
 /// Only floating-point types (`FloatType`) qualify.
 static bool isQuantizablePrimitiveType(Type inputType) {
   const bool isFloatingPoint = isa<FloatType>(inputType);
   return isFloatingPoint;
 }


 /// Builds a converter for `inputType`.
 ///
 /// For tensor and vector inputs the candidate expressed type is the element
 /// type; for any other input it is the input type itself. When the candidate
 /// is not a quantizable primitive type, the converter is created with a null
 /// expressed type, which marks the conversion as unsupported.
 ExpressedToQuantizedConverter
 ExpressedToQuantizedConverter::forInputType(Type inputType) {
   // Pick the type whose quantizability decides the outcome.
   Type candidate = inputType;
   if (isa<TensorType, VectorType>(inputType))
     candidate = cast<ShapedType>(inputType).getElementType();

   // A null expressed type signals "unsupported" to the converter's users.
   Type expressed = isQuantizablePrimitiveType(candidate) ? candidate : Type();
   return ExpressedToQuantizedConverter{inputType, expressed};
 }


 /// Rebuilds `inputType` on top of the quantized `elementalType`.
 ///
 /// Ranked tensors and vectors keep their shape, unranked tensors stay
 /// unranked, and in each case the element type is swapped for
 /// `elementalType`. For any other input, `elementalType` itself is returned
 /// when its expressed type equals this converter's expressed type; otherwise
 /// a null type is returned. Asserts that the converter has a non-null
 /// expressed type.
 Type ExpressedToQuantizedConverter::convert(QuantizedType elementalType) const {
   assert(expressedType && "convert() on unsupported conversion");

   // Container inputs: the three cases are mutually exclusive type kinds.
   if (auto vecTy = dyn_cast<VectorType>(inputType))
     return VectorType::get(vecTy.getShape(), elementalType);
   if (isa<UnrankedTensorType>(inputType))
     return UnrankedTensorType::get(elementalType);
   if (auto rankedTy = dyn_cast<RankedTensorType>(inputType))
     return RankedTensorType::get(rankedTy.getShape(), elementalType);

   // Non-container input: usable only if the expressed types agree.
   const bool sameExpressedType =
       elementalType.getExpressedType() == expressedType;
   if (!sameExpressedType)
     return Type();
   return elementalType;
 }


 /// Quantizes `realValue` when it is a dense floating-point elements attribute
 /// by forwarding to the `DenseFPElementsAttr` overload. Every other attribute
 /// kind yields a null attribute.
 ElementsAttr
 UniformQuantizedPerAxisValueConverter::convert(Attribute realValue) {
   auto denseFloats = dyn_cast<DenseFPElementsAttr>(realValue);
   // TODO: handles sparse elements attribute
   if (!denseFloats)
     return nullptr;
   return convert(denseFloats);
 }


 /// Quantizes every element of the dense floating-point attribute `attr`,
 /// choosing the converter by the element's position along `quantizationDim`.
 ///
 /// Returns a null attribute when the size of the quantization dimension does
 /// not match the number of scales. Otherwise returns the result of mapping
 /// each element to an integer of `storageBitWidth` bits.
 DenseElementsAttr
 UniformQuantizedPerAxisValueConverter::convert(DenseFPElementsAttr attr) {
   // Creates the converter for each chunk. Normally the size of the
   // quantization dim is 3, so we can cache all the converters.
   ShapedType type = attr.getType();
   size_t dimSize = type.getDimSize(quantizationDim);
   if (dimSize != scales.size()) {
     return {};
   }
   SmallVector<UniformQuantizedValueConverter, 4> converters;
   converters.reserve(dimSize);
   for (int i = 0, e = dimSize; i != e; ++i) {
     converters.push_back(getPerChunkConverter(i));
   }

   // Scan the elements of the dense elements attributes and quantize them by
   // using the right quantization parameters.
   int64_t flattenIndex = 0;
   auto shape = type.getShape();
   // Number of consecutive flattened elements that share one index along the
   // quantization dimension: the product of all dimensions after it. The seed
   // must be int64_t; an `int` seed makes std::accumulate keep an `int`
   // accumulator and narrows the 64-bit product on every step.
   int64_t chunkSize =
       std::accumulate(std::next(shape.begin(), quantizationDim + 1),
                       shape.end(), int64_t{1}, std::multiplies<int64_t>());
   Type newElementType = IntegerType::get(attr.getContext(), storageBitWidth);
   // NOTE(review): relies on mapValues invoking the callback once per element
   // in flattened order, so that flattenIndex tracks the element position --
   // confirm against DenseFPElementsAttr::mapValues.
   return attr.mapValues(newElementType, [&](const APFloat &old) {
     // Kept as 64-bit so the quotient is not narrowed for large attributes.
     int64_t chunkIndex = (flattenIndex++) / chunkSize;
     return converters[chunkIndex % dimSize].quantizeFloatToInt(old);
   });
 }

isQuantizablePrimitiveType
static bool isQuantizablePrimitiveType(Type inputType)
Definition: UniformSupport.cpp:16

UniformSupport.h

llvm::SmallVector
Definition: LLVM.h:72

mlir::Attribute
Attributes are known-constant values of operations.
Definition: Attributes.h:25

mlir::DenseElementsAttr
An attribute that represents a reference to a dense vector or tensor object.
Definition: BuiltinAttributes.h:82

mlir::DenseFPElementsAttr
An attribute that represents a reference to a dense float vector or tensor object.
Definition: BuiltinAttributes.h:913

mlir::DenseFPElementsAttr::mapValues
DenseElementsAttr mapValues(Type newElementType, function_ref< APInt(const APFloat &)> mapping) const
Generates a new DenseElementsAttr by mapping each value attribute, and constructing the DenseElements...
Definition: BuiltinAttributes.cpp:1506

mlir::Type
Instances of the Type class are uniqued, have an immutable identifier and an optional mutable compone...
Definition: Types.h:74

mlir::quant::QuantizedType
Base class for all quantized types known to this dialect.
Definition: QuantTypes.h:50

mlir::quant::QuantizedType::getExpressedType
Type getExpressedType() const
Gets the original expressed type that this quantized type approximates.
Definition: QuantTypes.cpp:109

mlir::quant::UniformQuantizedPerAxisValueConverter::convert
ElementsAttr convert(Attribute realValue)
Quantize an Attribute by the quantization parameters.
Definition: UniformSupport.cpp:52

BuiltinTypes.h

mlir::quant
Definition: Quant.h:25

mlir
Include the generated interface declarations.
Definition: LocalAliasAnalysis.h:20

mlir::get
auto get(MLIRContext *context, Ts &&...params)
Helper method that injects context only if needed, this helps unify some of the attribute constructio...
Definition: BytecodeImplementation.h:509

mlir::quant::ExpressedToQuantizedConverter
Performs type conversion from an arbitrary input type to a type that is expressed by a QuantizedType.
Definition: UniformSupport.h:34

mlir::quant::ExpressedToQuantizedConverter::forInputType
static ExpressedToQuantizedConverter forInputType(Type inputType)
Creates a converter for the given input type.
Definition: UniformSupport.cpp:21

mlir::quant::ExpressedToQuantizedConverter::inputType
const Type inputType
The input type that is being converted from.
Definition: UniformSupport.h:47

mlir::quant::ExpressedToQuantizedConverter::convert
Type convert(QuantizedType elementalType) const
Converts the inputType to be based on the given elemental type, returning the new type (or nullptr an...
Definition: UniformSupport.cpp:35

mlir::quant::ExpressedToQuantizedConverter::expressedType
const Type expressedType
Supported, elemental expressed type (i.e.
Definition: UniformSupport.h:51