COMPMID-2608: Enable quantization with multiplier greater than 1 on NEON
Change-Id: Ib2b0c9ac88fc2b645f478c9981f71ee28f2c77fd
Signed-off-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Reviewed-on: https://review.mlplatform.org/c/2425
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
diff --git a/src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp b/src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp
index e36cb3d..440f043 100644
--- a/src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp
+++ b/src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp
@@ -344,6 +344,19 @@
{
run_optimised = bool(NEGEMMAssemblyDispatch::validate(a_to_use, b, c, output, gemm_info));
run_optimised_requantized = run_optimised;
+
+ const UniformQuantizationInfo a_qinfo = a_to_use->quantization_info().uniform();
+ const QuantizationInfo b_qinfo = b->quantization_info();
+ const UniformQuantizationInfo output_qinfo = output->quantization_info().uniform();
+ for(auto const s : b_qinfo.scale())
+ {
+ const float fmultipler = a_qinfo.scale * s / output_qinfo.scale;
+ if(fmultipler > 1.f)
+ {
+ run_optimised_requantized = false;
+ break;
+ }
+ }
}
else
{