telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 1 | // |
| 2 | // Copyright © 2017 Arm Ltd. All rights reserved. |
David Beck | ecb56cd | 2018-09-05 12:52:57 +0100 | [diff] [blame] | 3 | // SPDX-License-Identifier: MIT |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 4 | // |
| 5 | |
Aron Virginas-Tar | 5605519 | 2018-11-12 18:10:43 +0000 | [diff] [blame] | 6 | #include "NeonWorkloadFactoryHelper.hpp" |
| 7 | |
Aron Virginas-Tar | 3b278e9 | 2018-10-12 13:00:55 +0100 | [diff] [blame] | 8 | |
Colm Donelan | c42a987 | 2022-02-02 16:35:09 +0000 | [diff] [blame] | 9 | #include <armnnTestUtils/TensorHelpers.hpp> |
Aron Virginas-Tar | 3b278e9 | 2018-10-12 13:00:55 +0100 | [diff] [blame] | 10 | |
Colm Donelan | 0c47974 | 2021-12-10 12:43:54 +0000 | [diff] [blame] | 11 | #include <armnn/backends/TensorHandle.hpp> |
| 12 | #include <armnn/backends/WorkloadFactory.hpp> |
Aron Virginas-Tar | 3b278e9 | 2018-10-12 13:00:55 +0100 | [diff] [blame] | 13 | |
Aron Virginas-Tar | c9cc804 | 2018-11-01 16:15:57 +0000 | [diff] [blame] | 14 | #include <neon/NeonTimer.hpp> |
| 15 | #include <neon/NeonWorkloadFactory.hpp> |
Aron Virginas-Tar | 3b278e9 | 2018-10-12 13:00:55 +0100 | [diff] [blame] | 16 | |
Aron Virginas-Tar | c9cc804 | 2018-11-01 16:15:57 +0000 | [diff] [blame] | 17 | #include <backendsCommon/test/LayerTests.hpp> |
Sadik Armagan | a097d2a | 2021-11-24 15:47:28 +0000 | [diff] [blame] | 18 | #include <armnnTestUtils/TensorCopyUtils.hpp> |
Colm Donelan | 0c47974 | 2021-12-10 12:43:54 +0000 | [diff] [blame] | 19 | #include <armnnTestUtils/WorkloadTestUtils.hpp> |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 20 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 21 | #include <doctest/doctest.h> |
Aron Virginas-Tar | 3b278e9 | 2018-10-12 13:00:55 +0100 | [diff] [blame] | 22 | |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 23 | #include <cstdlib> |
| 24 | #include <algorithm> |
| 25 | |
| 26 | using namespace armnn; |
| 27 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 28 | TEST_SUITE("NeonTimerInstrument") |
| 29 | { |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 30 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 31 | TEST_CASE("NeonTimerGetName") |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 32 | { |
| 33 | NeonTimer neonTimer; |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 34 | CHECK_EQ(std::string(neonTimer.GetName()), "NeonKernelTimer"); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 35 | } |
| 36 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 37 | TEST_CASE("NeonTimerMeasure") |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 38 | { |
Aron Virginas-Tar | 5caf907 | 2018-11-14 18:35:18 +0000 | [diff] [blame] | 39 | NeonWorkloadFactory workloadFactory = |
| 40 | NeonWorkloadFactoryHelper::GetFactory(NeonWorkloadFactoryHelper::GetMemoryManager()); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 41 | |
Conor Kennedy | f341d7f | 2019-05-27 13:20:38 +0100 | [diff] [blame] | 42 | unsigned int inputWidth = 2000u; |
| 43 | unsigned int inputHeight = 2000u; |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 44 | unsigned int inputChannels = 1u; |
| 45 | unsigned int inputBatchSize = 1u; |
| 46 | |
| 47 | float upperBound = 1.0f; |
| 48 | float lowerBound = -1.0f; |
| 49 | |
| 50 | size_t inputSize = inputWidth * inputHeight * inputChannels * inputBatchSize; |
| 51 | std::vector<float> inputData(inputSize, 0.f); |
| 52 | std::generate(inputData.begin(), inputData.end(), [](){ |
| 53 | return (static_cast<float>(rand()) / static_cast<float>(RAND_MAX / 3)) + 1.f; }); |
| 54 | |
| 55 | unsigned int outputWidth = inputWidth; |
| 56 | unsigned int outputHeight = inputHeight; |
| 57 | unsigned int outputChannels = inputChannels; |
| 58 | unsigned int outputBatchSize = inputBatchSize; |
| 59 | |
| 60 | armnn::TensorInfo inputTensorInfo({ inputBatchSize, inputChannels, inputHeight, inputWidth }, |
Nattapat Chaimanowong | 649dd95 | 2019-01-22 16:10:44 +0000 | [diff] [blame] | 61 | armnn::DataType::Float32); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 62 | |
| 63 | armnn::TensorInfo outputTensorInfo({ outputBatchSize, outputChannels, outputHeight, outputWidth }, |
Nattapat Chaimanowong | 649dd95 | 2019-01-22 16:10:44 +0000 | [diff] [blame] | 64 | armnn::DataType::Float32); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 65 | |
Teresa Charlin | e2a3b3f | 2020-08-17 23:22:11 +0100 | [diff] [blame] | 66 | ARMNN_NO_DEPRECATE_WARN_BEGIN |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 67 | std::unique_ptr<armnn::ITensorHandle> inputHandle = workloadFactory.CreateTensorHandle(inputTensorInfo); |
| 68 | std::unique_ptr<armnn::ITensorHandle> outputHandle = workloadFactory.CreateTensorHandle(outputTensorInfo); |
Teresa Charlin | e2a3b3f | 2020-08-17 23:22:11 +0100 | [diff] [blame] | 69 | ARMNN_NO_DEPRECATE_WARN_END |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 70 | |
| 71 | // Setup bounded ReLu |
| 72 | armnn::ActivationQueueDescriptor descriptor; |
| 73 | armnn::WorkloadInfo workloadInfo; |
| 74 | AddInputToWorkload(descriptor, workloadInfo, inputTensorInfo, inputHandle.get()); |
| 75 | AddOutputToWorkload(descriptor, workloadInfo, outputTensorInfo, outputHandle.get()); |
| 76 | |
| 77 | descriptor.m_Parameters.m_Function = armnn::ActivationFunction::BoundedReLu; |
| 78 | descriptor.m_Parameters.m_A = upperBound; |
| 79 | descriptor.m_Parameters.m_B = lowerBound; |
| 80 | |
Teresa Charlin | 611c7fb | 2022-01-07 09:47:29 +0000 | [diff] [blame] | 81 | std::unique_ptr<armnn::IWorkload> workload |
| 82 | = workloadFactory.CreateWorkload(LayerType::Activation, descriptor, workloadInfo); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 83 | |
| 84 | inputHandle->Allocate(); |
| 85 | outputHandle->Allocate(); |
| 86 | |
Sadik Armagan | 483c811 | 2021-06-01 09:24:52 +0100 | [diff] [blame] | 87 | CopyDataToITensorHandle(inputHandle.get(), inputData.data()); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 88 | |
| 89 | NeonTimer neonTimer; |
| 90 | // Start the timer. |
| 91 | neonTimer.Start(); |
| 92 | // Execute the workload. |
| 93 | workload->Execute(); |
| 94 | // Stop the timer. |
| 95 | neonTimer.Stop(); |
| 96 | |
| 97 | std::vector<Measurement> measurements = neonTimer.GetMeasurements(); |
| 98 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 99 | CHECK(measurements.size() <= 2); |
Matthew Bentham | 679efda | 2018-12-10 13:14:37 +0000 | [diff] [blame] | 100 | if (measurements.size() > 1) |
| 101 | { |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 102 | CHECK_EQ(measurements[0].m_Name, "NeonKernelTimer/0: NEFillBorderKernel"); |
| 103 | CHECK(measurements[0].m_Value > 0.0); |
Matthew Bentham | 679efda | 2018-12-10 13:14:37 +0000 | [diff] [blame] | 104 | } |
Nikhil Raj | 13816cd | 2021-01-12 14:29:18 +0000 | [diff] [blame] | 105 | std::ostringstream oss_neon; |
| 106 | std::ostringstream oss_cpu; |
| 107 | oss_neon << "NeonKernelTimer/" << measurements.size()-1 << ": NEActivationLayerKernel"; |
| 108 | oss_cpu << "NeonKernelTimer/" << measurements.size()-1 << ": CpuActivationKernel"; |
Nikhil Raj | 7af2fd7 | 2021-06-30 11:51:10 +0100 | [diff] [blame] | 109 | bool kernelCheck = ((measurements[measurements.size()-1].m_Name.find(oss_neon.str()) != std::string::npos) |
| 110 | || (measurements[measurements.size()-1].m_Name.find(oss_cpu.str()) != std::string::npos)); |
| 111 | CHECK(kernelCheck); |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 112 | CHECK(measurements[measurements.size()-1].m_Value > 0.0); |
telsoa01 | c577f2c | 2018-08-31 09:22:23 +0100 | [diff] [blame] | 113 | } |
| 114 | |
Sadik Armagan | 1625efc | 2021-06-10 18:24:34 +0100 | [diff] [blame] | 115 | } |