QuantUtils.h source code [mlir/include/mlir/Dialect/Tosa/Utils/QuantUtils.h]

1	//===-- QuantUtils.h - TOSA numerical support declarations ------*- C++ -*-===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	//
9	// Function declarations for TOSA numerical support functions and quantization
10	// attribute builders
11	//
12	//===----------------------------------------------------------------------===//
13
14	#ifndef MLIR_DIALECT_TOSA_UTILS_QUANTUTILS_H
15	#define MLIR_DIALECT_TOSA_UTILS_QUANTUTILS_H
16
17	#include "mlir/Dialect/Tosa/IR/TosaOps.h"
18
19	#include "mlir/Dialect/Quant/FakeQuantSupport.h"
20	#include "mlir/Dialect/Quant/UniformSupport.h"
21
22	namespace mlir {
23	namespace tosa {
24
25	//===----------------------------------------------------------------------===//
26	// Utility functions to support quantization handling in Tosa.
27	//===----------------------------------------------------------------------===//
28
29	/// Computes `multiplier` and `shift` from `scale`, storing both through
30	/// the reference parameters, for a `scaleWidth` of 16 or 32 bits.
31	void computeMultiplierAndShift(double scale, int32_t &multiplier,
32	int32_t &shift, int32_t scaleWidth);
33
34	/// Builds a ConvOpQuantizationAttr from the `input` and `weight` values.
35	ConvOpQuantizationAttr buildConvOpQuantizationAttr(OpBuilder &builder,
36	Value input, Value weight);
37
38	/// Builds a MatMulOpQuantizationAttr for MatMul operations from `a` and `b`.
39	MatMulOpQuantizationAttr buildMatMulOpQuantizationAttr(OpBuilder &builder,
40	Value a, Value b);
41
42	/// Builds a UnaryOpQuantizationAttr from `input` and `outputRawType`.
43	UnaryOpQuantizationAttr buildUnaryOpQuantizationAttr(OpBuilder &builder,
44	Value input,
45	Type outputRawType);
46
47	/// Builds a PadOpQuantizationAttr for pad operations from the `input` value.
48	PadOpQuantizationAttr buildPadOpQuantizationAttr(OpBuilder &builder,
49	Value input);
50
51	/// Constructs the ConvOp output type with the correct bitwidth based on the
52	/// `input`/`weight` width.
53	Type buildConvOpResultTypeInfo(OpBuilder &builder, Type outputType, Value input,
54	Value weight);
55
56	/// Builds a Tosa quantization type (returned as a `Type`) from min/max values.
57	Type buildQTypeFromMinMax(OpBuilder builder, Type inputDType, Attribute minAttr,
58	Attribute maxAttr, IntegerAttr quantBits,
59	int filterQuantDim, bool isSigned,
60	BoolAttr narrowRange);
61
62	/// Builds a Tosa quantization type attribute (`TypeAttr`) from min/max values.
63	TypeAttr buildQTypeAttrFromMinMax(OpBuilder builder, Type inputDType,
64	Attribute minAttr, Attribute maxAttr,
65	IntegerAttr quantBits, int filterQuantDim,
66	bool isSigned, BoolAttr narrowRange);
67
68	} // namespace tosa
69	} // namespace mlir
70
71	#endif // MLIR_DIALECT_TOSA_UTILS_QUANTUTILS_H
72

source code of mlir/include/mlir/Dialect/Tosa/Utils/QuantUtils.h