blob: ff27048b3cec360183526e3007e34f55c0a5963e [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
Aron Virginas-Tar56055192018-11-12 18:10:43 +00006#include "NeonWorkloadFactoryHelper.hpp"
7
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +01008
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +00009#include <test/TensorHelpers.hpp>
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +010010
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000011#include <backendsCommon/CpuTensorHandle.hpp>
12#include <backendsCommon/WorkloadFactory.hpp>
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +010013
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000014#include <neon/NeonTimer.hpp>
15#include <neon/NeonWorkloadFactory.hpp>
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +010016
Aron Virginas-Tarc9cc8042018-11-01 16:15:57 +000017#include <backendsCommon/test/LayerTests.hpp>
18#include <backendsCommon/test/TensorCopyUtils.hpp>
19#include <backendsCommon/test/WorkloadTestUtils.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010020
21#include <boost/test/unit_test.hpp>
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +010022
telsoa01c577f2c2018-08-31 09:22:23 +010023#include <cstdlib>
24#include <algorithm>
25
26using namespace armnn;
27
28BOOST_AUTO_TEST_SUITE(NeonTimerInstrument)
29
30
31BOOST_AUTO_TEST_CASE(NeonTimerGetName)
32{
33 NeonTimer neonTimer;
34 BOOST_CHECK_EQUAL(neonTimer.GetName(), "NeonKernelTimer");
35}
36
37BOOST_AUTO_TEST_CASE(NeonTimerMeasure)
38{
Aron Virginas-Tar5caf9072018-11-14 18:35:18 +000039 NeonWorkloadFactory workloadFactory =
40 NeonWorkloadFactoryHelper::GetFactory(NeonWorkloadFactoryHelper::GetMemoryManager());
telsoa01c577f2c2018-08-31 09:22:23 +010041
Conor Kennedyf341d7f2019-05-27 13:20:38 +010042 unsigned int inputWidth = 2000u;
43 unsigned int inputHeight = 2000u;
telsoa01c577f2c2018-08-31 09:22:23 +010044 unsigned int inputChannels = 1u;
45 unsigned int inputBatchSize = 1u;
46
47 float upperBound = 1.0f;
48 float lowerBound = -1.0f;
49
50 size_t inputSize = inputWidth * inputHeight * inputChannels * inputBatchSize;
51 std::vector<float> inputData(inputSize, 0.f);
52 std::generate(inputData.begin(), inputData.end(), [](){
53 return (static_cast<float>(rand()) / static_cast<float>(RAND_MAX / 3)) + 1.f; });
54
55 unsigned int outputWidth = inputWidth;
56 unsigned int outputHeight = inputHeight;
57 unsigned int outputChannels = inputChannels;
58 unsigned int outputBatchSize = inputBatchSize;
59
60 armnn::TensorInfo inputTensorInfo({ inputBatchSize, inputChannels, inputHeight, inputWidth },
Nattapat Chaimanowong649dd952019-01-22 16:10:44 +000061 armnn::DataType::Float32);
telsoa01c577f2c2018-08-31 09:22:23 +010062
63 armnn::TensorInfo outputTensorInfo({ outputBatchSize, outputChannels, outputHeight, outputWidth },
Nattapat Chaimanowong649dd952019-01-22 16:10:44 +000064 armnn::DataType::Float32);
telsoa01c577f2c2018-08-31 09:22:23 +010065
66 LayerTestResult<float, 4> result(inputTensorInfo);
67
68 auto input = MakeTensor<float, 4>(inputTensorInfo, inputData);
69
Teresa Charline2a3b3f2020-08-17 23:22:11 +010070 ARMNN_NO_DEPRECATE_WARN_BEGIN
telsoa01c577f2c2018-08-31 09:22:23 +010071 std::unique_ptr<armnn::ITensorHandle> inputHandle = workloadFactory.CreateTensorHandle(inputTensorInfo);
72 std::unique_ptr<armnn::ITensorHandle> outputHandle = workloadFactory.CreateTensorHandle(outputTensorInfo);
Teresa Charline2a3b3f2020-08-17 23:22:11 +010073 ARMNN_NO_DEPRECATE_WARN_END
telsoa01c577f2c2018-08-31 09:22:23 +010074
75 // Setup bounded ReLu
76 armnn::ActivationQueueDescriptor descriptor;
77 armnn::WorkloadInfo workloadInfo;
78 AddInputToWorkload(descriptor, workloadInfo, inputTensorInfo, inputHandle.get());
79 AddOutputToWorkload(descriptor, workloadInfo, outputTensorInfo, outputHandle.get());
80
81 descriptor.m_Parameters.m_Function = armnn::ActivationFunction::BoundedReLu;
82 descriptor.m_Parameters.m_A = upperBound;
83 descriptor.m_Parameters.m_B = lowerBound;
84
85 std::unique_ptr<armnn::IWorkload> workload = workloadFactory.CreateActivation(descriptor, workloadInfo);
86
87 inputHandle->Allocate();
88 outputHandle->Allocate();
89
90 CopyDataToITensorHandle(inputHandle.get(), &input[0][0][0][0]);
91
92 NeonTimer neonTimer;
93 // Start the timer.
94 neonTimer.Start();
95 // Execute the workload.
96 workload->Execute();
97 // Stop the timer.
98 neonTimer.Stop();
99
100 std::vector<Measurement> measurements = neonTimer.GetMeasurements();
101
Matthew Bentham679efda2018-12-10 13:14:37 +0000102 BOOST_CHECK(measurements.size() <= 2);
103 if (measurements.size() > 1)
104 {
105 BOOST_CHECK_EQUAL(measurements[0].m_Name, "NeonKernelTimer/0: NEFillBorderKernel");
106 BOOST_CHECK(measurements[0].m_Value > 0.0);
107 }
Matthew Benthamf8d63012018-12-10 17:05:25 +0000108 std::ostringstream oss;
109 oss << "NeonKernelTimer/" << measurements.size()-1 << ": NEActivationLayerKernel";
110 BOOST_CHECK_EQUAL(measurements[measurements.size()-1].m_Name, oss.str());
Matthew Bentham679efda2018-12-10 13:14:37 +0000111 BOOST_CHECK(measurements[measurements.size()-1].m_Value > 0.0);
telsoa01c577f2c2018-08-31 09:22:23 +0100112}
113
114BOOST_AUTO_TEST_SUITE_END()