blob: 66eb4ee28c7242846252a1ec172cf591bbdbaac8 [file] [log] [blame]
Narumol Prangnawaratea54a012020-03-16 16:36:10 +00001//
2// Copyright © 2020 Arm Ltd. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
6#include "ConvertFp32ToBf16TestImpl.hpp"
7
8#include <backendsCommon/test/TensorCopyUtils.hpp>
9#include <backendsCommon/test/WorkloadTestUtils.hpp>
10
11#include <test/TensorHelpers.hpp>
12
13LayerTestResult<armnn::BFloat16, 4> ConvertFp32ToBf16Test(
14 armnn::IWorkloadFactory& workloadFactory,
15 const armnn::IBackendInternal::IMemoryManagerSharedPtr& memoryManager)
16{
17 IgnoreUnused(memoryManager);
18
19 const armnn::TensorInfo inputTensorInfo({1, 2, 4, 3}, armnn::DataType::Float32);
20 const armnn::TensorInfo outputTensorInfo({1, 2, 4, 3}, armnn::DataType::BFloat16);
21
22 auto input = MakeTensor<float, 4>(inputTensorInfo,
23 { -37.5f, -15.2f, -8.76f,
24 -2.0f, -1.5f, -1.3f,
25 -0.5f, -0.4f, 0.0f,
26 1.0f, 0.4f, 0.5f,
27 1.3f, 1.5f, 2.0f,
28 8.76f, 15.2f, 37.5f,
29 3.8f, // 0x40733333 Round down
30 3.1055E+29f, // 0x707ADC3C Round up
31 9.149516E-10f, // 0x307B7FFF Round down
32 -3.8f, // 0xC0733333 Round down
33 -3.1055E+29f, // 0xF07ADC3C Round up
34 -9.149516E-10f // 0xB07B7FFF Round down
35 });
36
37 std::vector<armnn::BFloat16> outputValues = armnnUtils::QuantizedVector<armnn::BFloat16>(
38 {
39 -37.5f, -15.2f, -8.76f,
40 -2.0f, -1.5f, -1.3f,
41 -0.5f, -0.4f, 0.0f,
42 1.0f, 0.4f, 0.5f,
43 1.3f, 1.5f, 2.0f,
44 8.76f, 15.2f, 37.5f,
45 3.796875f, // 0x4073
46 3.1072295E29f, // 0x707B
47 9.131327E-10f, // 0x307B
48 -3.796875f, // 0xC073
49 -3.1072295E29f, // 0xF07B
50 -9.131327E-10f // 0xB07B
51 },
52 1.0f, 0);
53
54 LayerTestResult<armnn::BFloat16, 4> ret(outputTensorInfo);
55 ret.outputExpected = MakeTensor<armnn::BFloat16, 4>(outputTensorInfo, outputValues);
56
57 std::unique_ptr<armnn::ITensorHandle> inputHandle = workloadFactory.CreateTensorHandle(inputTensorInfo);
58 std::unique_ptr<armnn::ITensorHandle> outputHandle = workloadFactory.CreateTensorHandle(outputTensorInfo);
59
60 armnn::ConvertFp32ToBf16QueueDescriptor data;
61 armnn::WorkloadInfo info;
62 AddInputToWorkload(data, info, inputTensorInfo, inputHandle.get());
63 AddOutputToWorkload(data, info, outputTensorInfo, outputHandle.get());
64
65 std::unique_ptr<armnn::IWorkload> workload = workloadFactory.CreateConvertFp32ToBf16(data, info);
66
67 inputHandle->Allocate();
68 outputHandle->Allocate();
69
70 CopyDataToITensorHandle(inputHandle.get(), &input[0][0][0][0]);
71
72 workload->Execute();
73
74 CopyDataFromITensorHandle(&ret.output[0][0][0][0], outputHandle.get());
75
76 return ret;
77}