Blame - arm_compute/core/QuantizationInfo.h - ml/ComputeLibrary

blob: 471b8c57aba6100f8962e270659ebd252968fd57 [file] [log] [blame]

Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	1	/*
Pablo Marquez Tello	9c8f9a9	2023-06-08 12:00:29 +0100	[diff] [blame]	2	* Copyright (c) 2019-2023 Arm Limited.
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	24	#ifndef ARM_COMPUTE_QUANTIZATION_INFO_H
				25	#define ARM_COMPUTE_QUANTIZATION_INFO_H
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	26
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	27	#include "arm_compute/core/Rounding.h"
Matthew Bentham	7d9a78e	2023-05-31 13:18:33 +0000	[diff] [blame]	28	#include "arm_compute/core/utils/misc/Utility.h"
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	29
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	30	#include "support/ToolchainSupport.h"
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	31
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	32	#include <vector>
				33
				34	namespace arm_compute
				35	{
Michalis Spyrou	8d4d1b8	2019-11-28 11:31:23 +0000	[diff] [blame]	36	using qasymm8_signed_t = int8_t; /**< 8 bit signed quantized asymmetric scalar value */
				37	using qasymm8_t = uint8_t; /**< 8 bit quantized asymmetric scalar value */
				38	using qsymm16_t = int16_t; /**< 16 bit quantized symmetric scalar value */
				39	using qasymm16_t = uint16_t; /**< 16 bit quantized asymmetric scalar value */
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	40
				41	/** Quantization info when assuming per layer quantization */
				42	struct UniformQuantizationInfo
				43	{
				44	/** Default constructor */
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	45	UniformQuantizationInfo() : scale(0.f), offset(0)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	46	{
				47	}
				48	/** Constructor
				49	*
				50	* @param[in] scale Quantization scale
				51	* @param[in] offset Quantization offset
				52	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	53	UniformQuantizationInfo(float scale, int32_t offset) : scale(scale), offset(offset)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	54	{
				55	}
				56	/** Checks if the scale and offset are both zero */
				57	bool empty() const
				58	{
				59	return (scale == 0) && (offset == 0);
				60	}
				61
				62	float scale;
				63	int32_t offset;
				64	};
				65
				66	/** Quantization information */
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	67	class QuantizationInfo
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	68	{
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	69	public:
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	70	/** Default constructor */
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	71	QuantizationInfo() noexcept : _scale(), _offset()
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	72	{
				73	}
				74	/** Construct quantization info.
				75	*
				76	* @note Used for symmetric quantization
				77	*
				78	* @param[in] scale Scale.
				79	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	80	QuantizationInfo(float scale) : _scale(1, scale), _offset()
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	81	{
				82	}
				83	/** Construct quantization info.
				84	*
				85	* @note Used for asymmetric quantization
				86	*
				87	* @param[in] scale Scale.
				88	* @param[in] offset Offset.
				89	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	90	QuantizationInfo(float scale, int offset) : _scale(1, scale), _offset(1, offset)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	91	{
				92	}
				93	/** Construct quantization info.
				94	*
				95	* @note Used for symmetric per channel quantization
				96	*
				97	* @param[in] scale Scale.
				98	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	99	QuantizationInfo(std::vector<float> scale) : _scale(scale), _offset()
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	100	{
				101	}
Michalis Spyrou	29a01c9	2019-08-22 11:44:04 +0100	[diff] [blame]	102	/** Construct quantization info.
				103	*
				104	* @note Used for asymmetric per channel quantization
				105	*
				106	* @param[in] scale Scale.
				107	* @param[in] offset Offset.
				108	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	109	QuantizationInfo(std::vector<float> scale, std::vector<int32_t> offset) : _scale(scale), _offset(offset)
Michalis Spyrou	29a01c9	2019-08-22 11:44:04 +0100	[diff] [blame]	110	{
				111	}
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	112	/** Scale vector accessor
				113	*
				114	* @return A reference to quantization scale metadata
				115	*/
				116	const std::vector<float> &scale() const
				117	{
				118	return _scale;
				119	}
				120	/** Offset vector accessor
				121	*
				122	* @return A reference to quantization offset metadata
				123	*/
				124	const std::vector<int32_t> &offset() const
				125	{
				126	return _offset;
				127	}
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	128	/** Indicates whether this QuantizationInfo has valid settings or not
				129	*
				130	* @return True if this has invalid settings, i.e. both the scale and offset vectors are empty.
				131	*/
				132	bool empty() const
				133	{
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	134	return _scale.empty() && _offset.empty();
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	135	}
				136	/** Return per layer quantization info
				137	*
				138	* @return Uniform quantization information; in case of empty information, zero is returned in the respective fields
				139	*/
				140	UniformQuantizationInfo uniform() const
				141	{
				142	UniformQuantizationInfo uqinfo;
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	143	uqinfo.scale = _scale.empty() ? 0 : _scale[0];
				144	uqinfo.offset = _offset.empty() ? 0 : _offset[0];
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	145
				146	return uqinfo;
				147	}
				148
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	149	private:
				150	std::vector<float> _scale; /**< Vector containing scaling factors */
				151	std::vector<int32_t> _offset; /**< Vector containing zero offsets */
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	152	};
				153
				154	/** Check whether two quantization info are equal.
				155	*
				156	* @param[in] lhs LHS quantization info.
				157	* @param[in] rhs RHS quantization info.
				158	*
				159	* @return True if the given quantization info is the same.
				160	*/
				161	inline bool operator==(const QuantizationInfo &lhs, const QuantizationInfo &rhs)
				162	{
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	163	return (lhs.scale() == rhs.scale()) && (lhs.offset() == rhs.offset());
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	164	}
				165
				166	/** Check whether two quantization info are not equal.
				167	*
				168	* @param[in] lhs LHS quantization info.
				169	* @param[in] rhs RHS quantization info.
				170	*
				171	* @return True if the given quantization info is not the same.
				172	*/
				173	inline bool operator!=(const QuantizationInfo &lhs, const QuantizationInfo &rhs)
				174	{
				175	return !(operator==(lhs, rhs));
				176	}
				177
				178	/** Check whether two quantization info are equal.
				179	*
				180	* @param[in] lhs LHS quantization info.
				181	* @param[in] rhs RHS quantization info.
				182	*
				183	* @return True if the given quantization info is the same.
				184	*/
				185	inline bool operator==(const UniformQuantizationInfo &lhs, const UniformQuantizationInfo &rhs)
				186	{
				187	return (lhs.scale == rhs.scale) && (lhs.offset == rhs.offset);
				188	}
				189
				190	/** Check whether two quantization info are not equal.
				191	*
				192	* @param[in] lhs LHS quantization info.
				193	* @param[in] rhs RHS quantization info.
				194	*
				195	* @return True if the given quantization info is not the same.
				196	*/
				197	inline bool operator!=(const UniformQuantizationInfo &lhs, const UniformQuantizationInfo &rhs)
				198	{
				199	return !(operator==(lhs, rhs));
				200	}
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	201	template <typename QUANTIZED_TYPE = uint8_t>
				202	struct Qasymm8QuantizationHelper
				203	{
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	204	static_assert(std::is_same<QUANTIZED_TYPE, uint8_t>::value || std::is_same<QUANTIZED_TYPE, int8_t>::value,
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	205	"quantized type should be either uint8_t or int8_t.");
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	206
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	207	/** Quantize a value given a 8-bit asymmetric quantization scheme
				208	*
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	209	* @param[in] value Value to quantize
				210	* @param[in] qinfo Quantization information to use for quantizing
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	211	*
				212	* @return Quantized value
				213	*/
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	214	static inline QUANTIZED_TYPE quantize(float value, const UniformQuantizationInfo &qinfo)
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	215	{
				216	ARM_COMPUTE_ERROR_ON(qinfo.scale == 0);
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	217	const int quantized = support::cpp11::lround(value / qinfo.scale) + qinfo.offset;
				218	return static_cast<QUANTIZED_TYPE>(arm_compute::utility::clamp<decltype(quantized), QUANTIZED_TYPE>(quantized));
				219	}
				220
				221	/** Quantize a value given a 8-bit asymmetric quantization scheme using a specific rounding policy
				222	*
				223	* @param[in] value Value to quantize
				224	* @param[in] qinfo Quantization information to use for quantizing
				225	* @param[in] rounding_policy Rounding policy to use
				226	*
				227	* @return Quantized value
				228	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	229	static inline QUANTIZED_TYPE
				230	quantize(float value, const UniformQuantizationInfo &qinfo, RoundingPolicy rounding_policy)
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	231	{
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	232	if (rounding_policy == RoundingPolicy::TO_NEAREST_UP)
Giorgio Arena	433ea49	2021-05-26 15:32:50 +0100	[diff] [blame]	233	{
				234	return quantize(value, qinfo);
				235	}
				236
				237	ARM_COMPUTE_ERROR_ON(qinfo.scale == 0);
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	238	const int quantized = arm_compute::round(value / qinfo.scale, rounding_policy) + qinfo.offset;
				239	return static_cast<QUANTIZED_TYPE>(arm_compute::utility::clamp<decltype(quantized), QUANTIZED_TYPE>(quantized));
				240	}
				241
				242	/** Quantize a value given a 8-bit asymmetric quantization scheme
				243	*
				244	* @param[in] value Value to quantize
				245	* @param[in] qinfo Quantization information to use for quantizing
				246	* @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
				247	*
				248	* @return Quantized value
				249	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	250	static inline QUANTIZED_TYPE
				251	quantize(float value, const QuantizationInfo &qinfo, RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	252	{
				253	const UniformQuantizationInfo uqinfo = qinfo.uniform();
				254	ARM_COMPUTE_ERROR_ON(uqinfo.scale == 0);
				255	const int quantized = arm_compute::round(value / uqinfo.scale, rounding_policy) + uqinfo.offset;
				256	return static_cast<QUANTIZED_TYPE>(arm_compute::utility::clamp<decltype(quantized), QUANTIZED_TYPE>(quantized));
				257	}
				258
				259	/** Dequantize a value given a 8-bit asymmetric quantization scheme
				260	*
				261	* @param[in] value Value to dequantize
				262	* @param[in] qinfo Quantization information to use for dequantizing
				263	*
				264	* @return Dequantized value
				265	*/
				266	static inline float dequantize(QUANTIZED_TYPE value, const UniformQuantizationInfo &qinfo)
				267	{
				268	return (static_cast<int>(value) - qinfo.offset) * qinfo.scale;
				269	}
				270
				271	/** Dequantize a value given a 8-bit asymmetric quantization scheme
				272	*
				273	* @param[in] value Value to dequantize
				274	* @param[in] qinfo Quantization information to use for dequantizing
				275	*
				276	* @return Dequantized value
				277	*/
				278	static inline float dequantize(QUANTIZED_TYPE value, const QuantizationInfo &qinfo)
				279	{
				280	const UniformQuantizationInfo uqinfo = qinfo.uniform();
				281	return (static_cast<int>(value) - uqinfo.offset) * uqinfo.scale;
				282	}
				283	};
				284
				285	/** Quantize a value given an unsigned 8-bit asymmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	286	*
				287	* @param[in] value Value to quantize
				288	* @param[in] qinfo Quantization information to use for quantizing
				289	* @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
				290	*
				291	* @return Quantized value
				292	*/
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	293	template <typename INFO_TYPE>
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	294	inline uint8_t
				295	quantize_qasymm8(float value, const INFO_TYPE &qinfo, RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	296	{
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	297	return Qasymm8QuantizationHelper<uint8_t>::quantize(value, qinfo, rounding_policy);
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	298	}
				299
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	300	/** Quantize a value given a signed 8-bit asymmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	301	*
				302	* @param[in] value Value to quantize
				303	* @param[in] qinfo Quantization information to use for quantizing
				304	* @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
				305	*
				306	* @return Quantized value
				307	*/
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	308	template <typename INFO_TYPE>
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	309	inline int8_t quantize_qasymm8_signed(float value,
				310	const INFO_TYPE &qinfo,
				311	RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	312	{
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	313	return Qasymm8QuantizationHelper<int8_t>::quantize(value, qinfo, rounding_policy);
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	314	}
				315
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	316	/** Quantize a value given a 8-bit symmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	317	*
				318	* @param[in] value Value to quantize
				319	* @param[in] qinfo Quantization information to use for quantizing
				320	*
				321	* @return Quantized value
				322	*/
				323	inline int8_t quantize_qsymm8(float value, const QuantizationInfo &qinfo)
				324	{
				325	int quantized = arm_compute::round(value / qinfo.uniform().scale, RoundingPolicy::TO_NEAREST_UP);
				326	quantized = std::max(-128, std::min(quantized, 127));
				327	return quantized;
				328	}
				329
Georgios Pinitas	dbdea0d	2019-10-16 19:21:40 +0100	[diff] [blame]	330	/** Quantize a value given a 8-bit symmetric per channel quantization scheme
				331	*
				332	* @param[in] value Value to quantize
				333	* @param[in] qinfo Quantization information to use for quantizing
				334	* @param[in] channel_id channel index into the scale vector of quantization info
				335	*
				336	* @return Quantized value
				337	*/
				338	inline int8_t quantize_qsymm8_per_channel(float value, const QuantizationInfo &qinfo, size_t channel_id = 0)
				339	{
				340	int quantized = arm_compute::round(value / qinfo.scale()[channel_id], RoundingPolicy::TO_NEAREST_UP);
				341	quantized = std::max(-128, std::min(quantized, 127));
				342	return quantized;
				343	}
				344
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	345	/** Dequantize a value given an unsigned 8-bit asymmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	346	*
				347	* @param[in] value Value to dequantize
				348	* @param[in] qinfo Quantization information to use for dequantizing
				349	*
				350	* @return Dequantized value
				351	*/
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	352	template <typename INFO_TYPE>
				353	inline float dequantize_qasymm8(uint8_t value, const INFO_TYPE &qinfo)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	354	{
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	355	return Qasymm8QuantizationHelper<uint8_t>::dequantize(value, qinfo);
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	356	}
				357
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	358	/** Dequantize a value given a signed 8-bit asymmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	359	*
				360	* @param[in] value Value to dequantize
				361	* @param[in] qinfo Quantization information to use for dequantizing
				362	*
				363	* @return Dequantized value
				364	*/
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	365	template <typename INFO_TYPE>
				366	inline float dequantize_qasymm8_signed(int8_t value, const INFO_TYPE &qinfo)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	367	{
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	368	return Qasymm8QuantizationHelper<int8_t>::dequantize(value, qinfo);
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	369	}
				370
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	371	/** Dequantize a value given an 8-bit asymmetric quantization scheme
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	372	*
				373	* @param[in] value Value to dequantize
				374	* @param[in] scale Scale to use for dequantization
				375	* @param[in] offset Zero-offset to use for dequantization
				376	*
				377	* @return Dequantized value
				378	*/
				379	inline float dequantize(uint8_t value, float scale, int32_t offset)
				380	{
				381	return (static_cast<int>(value) - offset) * scale;
				382	}
				383
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	384	/** Dequantize a value given a 8-bit symmetric quantization scheme
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	385	*
				386	* @param[in] value Value to dequantize
				387	* @param[in] qinfo Quantization information to use for dequantizing
				388	*
				389	* @return Dequantized value
				390	*/
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	391	inline float dequantize_qsymm8(int8_t value, const UniformQuantizationInfo &qinfo)
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	392	{
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	393	return value * qinfo.scale;
				394	}
				395
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	396	/** Dequantize a value given a 8-bit symmetric quantization scheme
Georgios Pinitas	3d13af8	2019-06-04 13:04:16 +0100	[diff] [blame]	397	*
				398	* @param[in] value Value to dequantize
				399	* @param[in] scale Scale to use for dequantization
				400	*
				401	* @return Dequantized value
				402	*/
				403	inline float dequantize(int8_t value, float scale)
				404	{
				405	return value * scale;
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	406	}
Manuel Bottini	3689fcd	2019-06-14 17:18:12 +0100	[diff] [blame]	407
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	408	/** Dequantize a value given a 16-bit symmetric quantization scheme
Manuel Bottini	10c53f1	2019-07-17 16:11:53 +0100	[diff] [blame]	409	*
				410	* @param[in] value Value to dequantize
				411	* @param[in] scale Scale to use for dequantization
				412	*
				413	* @return Dequantized value
				414	*/
				415	inline float dequantize(int16_t value, float scale)
				416	{
				417	return value * scale;
				418	}
				419
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	420	/** Dequantize a value given a 16-bit asymmetric quantization scheme
				421	*
				422	* @param[in] value Value to dequantize
				423	* @param[in] scale Scale to use for dequantization
				424	* @param[in] offset Zero-offset to use for dequantization
				425	*
				426	* @return Dequantized value
				427	*/
				428	inline float dequantize(uint16_t value, float scale, int32_t offset)
				429	{
				430	return (static_cast<int>(value) - offset) * scale;
				431	}
				432
Manuel Bottini	3689fcd	2019-06-14 17:18:12 +0100	[diff] [blame]	433	/** Quantize a value given a 16-bit symmetric quantization scheme
				434	*
				435	* @param[in] value Value to quantize
				436	* @param[in] qinfo Quantization information to use for quantizing
				437	* @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
				438	*
				439	* @return Quantized value
				440	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	441	inline int16_t quantize_qsymm16(float value,
				442	const UniformQuantizationInfo &qinfo,
				443	RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
Manuel Bottini	3689fcd	2019-06-14 17:18:12 +0100	[diff] [blame]	444	{
				445	int quantized = arm_compute::round(value / qinfo.scale, rounding_policy);
				446	quantized = arm_compute::utility::clamp<int, int16_t>(quantized);
				447	return quantized;
				448	}
				449
				450	/** Dequantize a value given a 16-bit symmetric quantization scheme
				451	*
				452	* @param[in] value Value to dequantize
				453	* @param[in] qinfo Quantization information to use for dequantizing
				454	*
				455	* @return Dequantized value
				456	*/
				457	inline float dequantize_qsymm16(int16_t value, const UniformQuantizationInfo &qinfo)
				458	{
				459	return value * qinfo.scale;
				460	}
				461
				462	/** Quantize a value given a 16-bit symmetric quantization scheme
				463	*
				464	* @param[in] value Value to quantize
				465	* @param[in] qinfo Quantization information to use for quantizing
				466	*
				467	* @return Quantized value
				468	*/
				469	inline int16_t quantize_qsymm16(float value, const QuantizationInfo &qinfo)
				470	{
				471	return quantize_qsymm16(value, qinfo.uniform());
				472	}
				473
				474	/** Dequantize a value given a 16-bit symmetric quantization scheme
				475	*
				476	* @param[in] value Value to dequantize
				477	* @param[in] qinfo Quantization information to use for dequantizing
				478	*
				479	* @return Dequantized value
				480	*/
				481	inline float dequantize_qsymm16(int16_t value, const QuantizationInfo &qinfo)
				482	{
				483	return dequantize_qsymm16(value, qinfo.uniform());
				484	}
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	485
				486	/** Quantize a value given a 16-bit asymmetric quantization scheme
				487	*
				488	* @param[in] value Value to quantize
				489	* @param[in] qinfo Quantization information to use for quantizing
				490	* @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
				491	*
				492	* @return Quantized value
				493	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	494	inline uint16_t quantize_qasymm16(float value,
				495	const UniformQuantizationInfo &qinfo,
				496	RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
Michele Di Giorgio	35ea9a7	2019-08-23 12:02:06 +0100	[diff] [blame]	497	{
				498	int quantized = arm_compute::round(value / qinfo.scale, rounding_policy) + qinfo.offset;
				499	quantized = arm_compute::utility::clamp<int, uint16_t>(quantized);
				500	return quantized;
				501	}
				502
				503	/** Dequantize a value given a 16-bit asymmetric quantization scheme
				504	*
				505	* @param[in] value Value to dequantize
				506	* @param[in] qinfo Quantization information to use for dequantizing
				507	*
				508	* @return Dequantized value
				509	*/
				510	inline float dequantize_qasymm16(uint16_t value, const UniformQuantizationInfo &qinfo)
				511	{
				512	return (static_cast<int>(value) - qinfo.offset) * qinfo.scale;
				513	}
				514
				515	/** Quantize a value given a 16-bit asymmetric quantization scheme
				516	*
				517	* @param[in] value Value to quantize
				518	* @param[in] qinfo Quantization information to use for quantizing
				519	*
				520	* @return Quantized value
				521	*/
				522	inline uint16_t quantize_qasymm16(float value, const QuantizationInfo &qinfo)
				523	{
				524	return quantize_qasymm16(value, qinfo.uniform());
				525	}
				526
				527	/** Dequantize a value given a 16-bit asymmetric quantization scheme
				528	*
				529	* @param[in] value Value to dequantize
				530	* @param[in] qinfo Quantization information to use for dequantizing
				531	*
				532	* @return Dequantized value
				533	*/
				534	inline float dequantize_qasymm16(uint16_t value, const QuantizationInfo &qinfo)
				535	{
				536	return dequantize_qasymm16(value, qinfo.uniform());
				537	}
Manuel Bottini	4370cff	2020-02-07 16:31:59 +0000	[diff] [blame]	538
				539	/*
				540	* In case of requantization of a quantized input tensor to an output tensor with another quantization,
				541	* instead of applying a dequantization and then a quantization function, we just compute a new scale and
				542	* offset.
				543	*
				544	* Assuming:
				545	* - q_i as input quantized value
				546	* - q_o as output quantized value
				547	* - z_i as input quantization offset value
				548	* - z_o as output quantization offset value
				549	* - s_i as input quantization scale value
				550	* - s_o as output quantization scale value
				551	* - z_n as new quantization offset value
				552	* - s_n as new quantization scale value
				553	*
				554	* q_o = ( q_i - z_i ) * s_i / s_o + z_o
				555	*
				556	* We can rewrite the formula as:
				557	*
				558	* q_o = ( q_i * s_i / s_o ) - z_i * s_i / s_o + z_o
				559	*
				560	* q_o = q_i / s_n + z_n
				561	*
				562	* Where:
				563	*
				564	* s_n = s_o / s_i
				565	*
				566	* z_n = - z_i * s_i / s_o + z_o
				567	*
				568	*/
Felix Thomasmathibalan	afd38f0	2023-09-27 17:46:17 +0100	[diff] [blame]	569	inline UniformQuantizationInfo compute_requantization_scale_offset(const UniformQuantizationInfo &uqinfo_in,
				570	const UniformQuantizationInfo &uqinfo_out)
Manuel Bottini	4370cff	2020-02-07 16:31:59 +0000	[diff] [blame]	571	{
				572	float scale_to_apply = uqinfo_out.scale;
				573	int32_t offset_to_apply = uqinfo_out.offset;
				574
				575	scale_to_apply /= uqinfo_in.scale;
				576	// In order to minimize flooring we convert the offset to a float,
				577	// then compute the new offset in the float domain,
				578	// finally we convert it back as int32_t
				579	offset_to_apply -= static_cast<int32_t>(static_cast<float>(uqinfo_in.offset) * uqinfo_in.scale / uqinfo_out.scale);
				580	return UniformQuantizationInfo(scale_to_apply, offset_to_apply);
				581	}
				582
Georgios Pinitas	4c5469b	2019-05-21 13:32:43 +0100	[diff] [blame]	583	} // namespace arm_compute
Sang-Hoon Park	ae6ef7c	2019-11-13 16:51:45 +0000	[diff] [blame]	584	#endif /* ARM_COMPUTE_QUANTIZATION_INFO_H */