mlir/html/QuantTypes_8h_source.html

 //===- QuantTypes.h - Quantization Ops and Types ----------------*- C++ -*-===//
 //
 // Part of the MLIR Project, under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//

 #ifndef MLIR_DIALECT_QUANTOPS_QUANT_TYPES_H_
 #define MLIR_DIALECT_QUANTOPS_QUANT_TYPES_H_

 #include "mlir/IR/Attributes.h"
 #include "mlir/IR/Builders.h"
 #include "mlir/IR/Dialect.h"
 #include "mlir/IR/OpDefinition.h"
 #include "mlir/IR/StandardTypes.h"
 #include "mlir/IR/Types.h"
 #include "llvm/Support/MathExtras.h"

 namespace mlir {
 namespace quant {

 class QuantizedIntegerType;

 namespace detail {

 struct QuantizedTypeStorage;
 struct AnyQuantizedTypeStorage;
 struct UniformQuantizedTypeStorage;
 struct UniformQuantizedPerAxisTypeStorage;

 } // namespace detail

 namespace QuantizationTypes {
 // Kind values for the quantized types declared in this header. Numbering
 // starts at Type::FIRST_QUANTIZATION_TYPE; each concrete type's `kindof`
 // compares against exactly one of these enumerators.
 enum Kind {
   // Kind matched by AnyQuantizedType::kindof.
   Any = Type::FIRST_QUANTIZATION_TYPE,
   // Kind matched by UniformQuantizedType::kindof.
   UniformQuantized,
   // Kind matched by UniformQuantizedPerAxisType::kindof.
   UniformQuantizedPerAxis,
   // Inclusive upper bound of the kind range tested by QuantizedType::classof.
   // Must be kept equal to the last real enumerator above.
   LAST_USED_QUANTIZATION_TYPE = UniformQuantizedPerAxis,
 };
 } // namespace QuantizationTypes

 namespace QuantizationFlags {
 // Bit values that may be set in the `flags` word of a quantized type (see
 // QuantizedType::getFlags / QuantizedType::isSigned).
 enum FlagValue {
   // Indicates that the storage type should be interpreted as a signed
   // integer. The default is to interpret it as an unsigned value.
   Signed = 1,
 };
 } // namespace QuantizationFlags

 /// Common base class of the quantized types declared in this header
 /// (AnyQuantizedType, UniformQuantizedType, UniformQuantizedPerAxisType).
 /// Only the small helpers below are defined inline; every other member is
 /// declared here and defined out of line.
 class QuantizedType : public Type {
 public:
   using ImplType = detail::QuantizedTypeStorage;
   using Type::Type;

   /// Upper limit, in bits, on the storage type width.
   static constexpr unsigned MaxStorageBits = 32;

   /// Construction-time verification hook shared by the quantized types.
   static LogicalResult
   verifyConstructionInvariants(Optional<Location> loc, MLIRContext *context,
                                unsigned flags, Type storageType,
                                Type expressedType, int64_t storageTypeMin,
                                int64_t storageTypeMax);

   /// Support method to enable LLVM-style type casting: accepts any type whose
   /// kind lies in the closed range
   /// [FIRST_QUANTIZATION_TYPE, LAST_USED_QUANTIZATION_TYPE].
   static bool classof(Type type) {
     const unsigned typeKind = type.getKind();
     return typeKind >= Type::FIRST_QUANTIZATION_TYPE &&
            typeKind <= QuantizationTypes::LAST_USED_QUANTIZATION_TYPE;
   }

   /// Smallest value representable in an integer of `integralWidth` bits:
   /// llvm::minIntN(integralWidth) when signed, 0 when unsigned.
   static int64_t getDefaultMinimumForInteger(bool isSigned,
                                              unsigned integralWidth) {
     return isSigned ? llvm::minIntN(integralWidth) : 0;
   }

   /// Largest value representable in an integer of `integralWidth` bits:
   /// llvm::maxIntN(integralWidth) when signed, llvm::maxUIntN(integralWidth)
   /// when unsigned.
   static int64_t getDefaultMaximumForInteger(bool isSigned,
                                              unsigned integralWidth) {
     if (!isSigned)
       return llvm::maxUIntN(integralWidth);
     return llvm::maxIntN(integralWidth);
   }

   // Accessors (defined out of line).
   Type getExpressedType() const;

   unsigned getFlags() const;

   /// Convenience helper: true when the QuantizationFlags::Signed bit is set
   /// in getFlags().
   bool isSigned() const {
     return (getFlags() & QuantizationFlags::Signed) != 0;
   }

   Type getStorageType() const;

   int64_t getStorageTypeMin() const;

   int64_t getStorageTypeMax() const;

   unsigned getStorageTypeIntegralWidth() const;

   bool isCompatibleExpressedType(Type candidateExpressedType);

   static QuantizedType getQuantizedElementType(Type primitiveOrContainerType);

   // Casts between quantized, storage and expressed types (defined out of
   // line).
   Type castFromStorageType(Type candidateType);

   static Type castToStorageType(Type quantizedType);

   Type castFromExpressedType(Type candidateType);

   static Type castToExpressedType(Type quantizedType);

   Type castExpressedToStorageType(Type candidateType);

 private:
   // Re-declare these inherited Type predicates as private so they are not
   // accessible through a QuantizedType.
   using Type::isBF16;
   using Type::isF16;
   using Type::isF32;
   using Type::isF64;
   using Type::isIndex;
   using Type::isInteger;
 };

 /// Quantized type identified by QuantizationTypes::Any. Its construction
 /// parameters are the flags, storage type, expressed type and storage range;
 /// it takes no scale or zero point arguments.
 class AnyQuantizedType
     : public Type::TypeBase<AnyQuantizedType, QuantizedType,
                             detail::AnyQuantizedTypeStorage> {
 public:
   using Base::Base;

   /// Builds an instance from the given parameters (defined out of line).
   static AnyQuantizedType get(unsigned flags, Type storageType,
                               Type expressedType, int64_t storageTypeMin,
                               int64_t storageTypeMax);

   /// Same parameters as `get`, plus the `location` to associate with the
   /// construction (defined out of line).
   static AnyQuantizedType getChecked(unsigned flags, Type storageType,
                                      Type expressedType, int64_t storageTypeMin,
                                      int64_t storageTypeMax, Location location);

   /// Construction-time verification hook for this type's parameters.
   static LogicalResult
   verifyConstructionInvariants(Optional<Location> loc, MLIRContext *context,
                                unsigned flags, Type storageType,
                                Type expressedType, int64_t storageTypeMin,
                                int64_t storageTypeMax);

   /// Support method to enable LLVM-style type casting.
   static bool kindof(unsigned kind) {
     return kind == QuantizationTypes::Any;
   }
 };

 /// Quantized type identified by QuantizationTypes::UniformQuantized. It
 /// carries one `scale` and one `zeroPoint` in addition to the common
 /// flags/storage/expressed parameters.
 class UniformQuantizedType
     : public Type::TypeBase<UniformQuantizedType, QuantizedType,
                             detail::UniformQuantizedTypeStorage> {
 public:
   using Base::Base;

   /// Support method to enable LLVM-style type casting.
   static bool kindof(unsigned kind) {
     return kind == QuantizationTypes::UniformQuantized;
   }

   /// Builds an instance from the given parameters (defined out of line).
   static UniformQuantizedType get(unsigned flags, Type storageType,
                                   Type expressedType, double scale,
                                   int64_t zeroPoint, int64_t storageTypeMin,
                                   int64_t storageTypeMax);

   /// Same parameters as `get`, plus the `location` to associate with the
   /// construction (defined out of line).
   static UniformQuantizedType
   getChecked(unsigned flags, Type storageType, Type expressedType, double scale,
              int64_t zeroPoint, int64_t storageTypeMin, int64_t storageTypeMax,
              Location location);

   /// Construction-time verification hook for this type's parameters.
   static LogicalResult verifyConstructionInvariants(
       Optional<Location> loc, MLIRContext *context, unsigned flags,
       Type storageType, Type expressedType, double scale, int64_t zeroPoint,
       int64_t storageTypeMin, int64_t storageTypeMax);

   // Accessors (defined out of line).
   double getScale() const;

   int64_t getZeroPoint() const;

   /// Fixed point values are real numbers divided by a scale.
   /// Currently, only signed storage types are treated as fixed point.
   /// A fixed point value can be obtained from an affine value by subtracting
   /// the zeroPoint.
   /// In the future, this may be explicit versus implied by type and zeroPoint.
   bool isFixedPoint() const {
     // Unsigned storage is never fixed point; the zero point is not consulted.
     if (!isSigned())
       return false;
     return getZeroPoint() == 0;
   }
 };

 /// Quantized type identified by QuantizationTypes::UniformQuantizedPerAxis.
 /// Instead of a single scale/zeroPoint pair it carries arrays of `scales` and
 /// `zeroPoints` together with the `quantizedDimension` they apply to.
 class UniformQuantizedPerAxisType
     : public Type::TypeBase<UniformQuantizedPerAxisType, QuantizedType,
                             detail::UniformQuantizedPerAxisTypeStorage> {
 public:
   using Base::Base;

   /// Builds an instance from the given parameters (defined out of line).
   static UniformQuantizedPerAxisType
   get(unsigned flags, Type storageType, Type expressedType,
       ArrayRef<double> scales, ArrayRef<int64_t> zeroPoints,
       int32_t quantizedDimension, int64_t storageTypeMin,
       int64_t storageTypeMax);

   /// Same parameters as `get`, plus the `location` to associate with the
   /// construction (defined out of line).
   static UniformQuantizedPerAxisType
   getChecked(unsigned flags, Type storageType, Type expressedType,
              ArrayRef<double> scales, ArrayRef<int64_t> zeroPoints,
              int32_t quantizedDimension, int64_t storageTypeMin,
              int64_t storageTypeMax, Location location);

   /// Construction-time verification hook for this type's parameters.
   static LogicalResult verifyConstructionInvariants(
       Optional<Location> loc, MLIRContext *context, unsigned flags,
       Type storageType, Type expressedType, ArrayRef<double> scales,
       ArrayRef<int64_t> zeroPoints, int32_t quantizedDimension,
       int64_t storageTypeMin, int64_t storageTypeMax);

   /// Support method to enable LLVM-style type casting.
   static bool kindof(unsigned kind) {
     return kind == QuantizationTypes::UniformQuantizedPerAxis;
   }

   // Accessors (defined out of line).
   ArrayRef<double> getScales() const;

   ArrayRef<int64_t> getZeroPoints() const;

   int32_t getQuantizedDimension() const;

   /// Per-axis counterpart of UniformQuantizedType::isFixedPoint: true only
   /// when the storage type is signed and every per-axis zero point is 0.
   ///
   /// The predicate previously tested `zeroPoint != 0`, which inverted the
   /// check relative to the scalar type (`isSigned() && getZeroPoint() == 0`)
   /// and reported types with all-nonzero zero points as fixed point.
   bool isFixedPoint() const {
     if (!isSigned())
       return false;
     return llvm::all_of(getZeroPoints(),
                         [](int64_t zeroPoint) { return zeroPoint == 0; });
   }
 };

 } // namespace quant
 } // namespace mlir

 #endif // MLIR_DIALECT_QUANTOPS_QUANT_TYPES_H_
mlir
Definition: InferTypeOpInterface.cpp:20

mlir::quant::QuantizationFlags::FlagValue
FlagValue
Definition: QuantTypes.h:45

mlir::quant::UniformQuantizedPerAxisType::kindof
static bool kindof(unsigned kind)
Support method to enable LLVM-style type casting.
Definition: QuantTypes.h:361

StandardTypes.h

Types.h

mlir::quant::detail::QuantizedTypeStorage
Definition: TypeDetail.h:23

mlir::quant::QuantizedType::getDefaultMinimumForInteger
static int64_t getDefaultMinimumForInteger(bool isSigned, unsigned integralWidth)
Definition: QuantTypes.h:82

mlir::quant::UniformQuantizedType
Definition: QuantTypes.h:270

mlir::quant::QuantizationTypes::Any
Definition: QuantTypes.h:36

llvm::Optional
Definition: LLVM.h:40

Attributes.h

mlir::Location
Definition: Location.h:52

mlir::Type::isIndex
bool isIndex()
Definition: StandardTypes.cpp:30

mlir::quant::UniformQuantizedType::kindof
static bool kindof(unsigned kind)
Support method to enable LLVM-style type casting.
Definition: QuantTypes.h:297

mlir::quant::QuantizationTypes::LAST_USED_QUANTIZATION_TYPE
Definition: QuantTypes.h:39

mlir::LogicalResult
Definition: LogicalResult.h:18

Builders.h

llvm::ArrayRef
Definition: LLVM.h:37

mlir::Type::getKind
unsigned getKind() const
Return the classification for this type.
Definition: Types.cpp:22

mlir::quant::UniformQuantizedPerAxisType::isFixedPoint
bool isFixedPoint() const
Definition: QuantTypes.h:391

mlir::quant::QuantizationFlags::Signed
Definition: QuantTypes.h:48

mlir::Type::isF32
bool isF32()
Definition: StandardTypes.cpp:27

mlir::quant::AnyQuantizedType
Definition: QuantTypes.h:209

mlir::Type::isBF16
bool isBF16()
Definition: StandardTypes.cpp:25

mlir::Type::Type
Type()
Definition: Types.h:111

mlir::quant::UniformQuantizedPerAxisType
Definition: QuantTypes.h:331

mlir::quant::QuantizationTypes::UniformQuantizedPerAxis
Definition: QuantTypes.h:38

mlir::quant::QuantizationTypes::UniformQuantized
Definition: QuantTypes.h:37

mlir::quant::QuantizedType::isSigned
bool isSigned() const
Definition: QuantTypes.h:117

mlir::Type
Definition: Types.h:84

OpDefinition.h

Dialect.h

mlir::quant::QuantizationTypes::Kind
Kind
Definition: QuantTypes.h:35

mlir::quant::QuantizedType::classof
static bool classof(Type type)
Support method to enable LLVM-style type casting.
Definition: QuantTypes.h:75

mlir::quant::QuantizedType
Definition: QuantTypes.h:60

mlir::detail::StorageUserBase
Definition: StorageUniquerSupport.h:30

mlir::MLIRContext
Definition: MLIRContext.h:34

mlir::Type::isInteger
bool isInteger(unsigned width)
Return true if this is an integer type with the specified width.
Definition: StandardTypes.cpp:33

mlir::Type::isF16
bool isF16()
Definition: StandardTypes.cpp:26

mlir::Type::isF64
bool isF64()
Definition: StandardTypes.cpp:28

mlir::quant::UniformQuantizedType::isFixedPoint
bool isFixedPoint() const
Definition: QuantTypes.h:314

mlir::quant::AnyQuantizedType::kindof
static bool kindof(unsigned kind)
Support method to enable LLVM-style type casting.
Definition: QuantTypes.h:216

mlir::quant::QuantizedType::getDefaultMaximumForInteger
static int64_t getDefaultMaximumForInteger(bool isSigned, unsigned integralWidth)
Definition: QuantTypes.h:92