//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
Matteo Martincighe011d202019-11-28 11:35:47 +00006#include <armnnUtils/FloatingPointConverter.hpp>
arovir01616e7752018-10-01 17:08:59 +01007
Narumol Prangnawarat88325222020-03-06 14:45:57 +00008#include "BFloat16.hpp"
arovir01616e7752018-10-01 17:08:59 +01009#include "Half.hpp"
telsoa01c577f2c2018-08-31 09:22:23 +010010
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +010011#include <armnn/utility/Assert.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010012
13namespace armnnUtils
14{
15
16void FloatingPointConverter::ConvertFloat32To16(const float* srcFloat32Buffer,
17 size_t numElements,
18 void* dstFloat16Buffer)
19{
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +010020 ARMNN_ASSERT(srcFloat32Buffer != nullptr);
21 ARMNN_ASSERT(dstFloat16Buffer != nullptr);
telsoa01c577f2c2018-08-31 09:22:23 +010022
Ryan OSheaf4bfa6a2020-06-10 11:33:37 +010023 armnn::Half* pHalf = static_cast<armnn::Half*>(dstFloat16Buffer);
telsoa01c577f2c2018-08-31 09:22:23 +010024
25 for (size_t i = 0; i < numElements; i++)
26 {
27 pHalf[i] = armnn::Half(srcFloat32Buffer[i]);
Narumol Prangnawarat9f62d332023-07-11 16:49:00 +010028 if (isinf(pHalf[i]))
29 {
30 // If the value of converted Fp16 is infinity, round to the closest finite Fp16 value.
31 pHalf[i] = copysign(std::numeric_limits<armnn::Half>::max(), pHalf[i]);
32 }
telsoa01c577f2c2018-08-31 09:22:23 +010033 }
34}
35
36void FloatingPointConverter::ConvertFloat16To32(const void* srcFloat16Buffer,
37 size_t numElements,
38 float* dstFloat32Buffer)
39{
Narumol Prangnawaratac2770a2020-04-01 16:51:23 +010040 ARMNN_ASSERT(srcFloat16Buffer != nullptr);
41 ARMNN_ASSERT(dstFloat32Buffer != nullptr);
telsoa01c577f2c2018-08-31 09:22:23 +010042
Ryan OSheaf4bfa6a2020-06-10 11:33:37 +010043 const armnn::Half* pHalf = static_cast<const armnn::Half*>(srcFloat16Buffer);
telsoa01c577f2c2018-08-31 09:22:23 +010044
45 for (size_t i = 0; i < numElements; i++)
46 {
47 dstFloat32Buffer[i] = pHalf[i];
48 }
49}
50
telsoa01c577f2c2018-08-31 09:22:23 +010051} //namespace armnnUtils