blob: a588a3ecc812baca632ff3710257ec7ff2b32f61 [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
arovir0143095f32018-10-09 18:04:24 +01005
arovir0143095f32018-10-09 18:04:24 +01006#include <backends/MemCopyWorkload.hpp>
Aron Virginas-Tar3b278e92018-10-12 13:00:55 +01007
8#include <backends/aclCommon/test/CreateWorkloadClNeon.hpp>
9
David Beck0dbe0ee2018-09-24 15:59:27 +010010#include <backends/neon/NeonWorkloadFactory.hpp>
11#include <backends/neon/NeonTensorHandle.hpp>
12#include <backends/neon/workloads/NeonWorkloadUtils.hpp>
13#include <backends/neon/workloads/NeonWorkloads.hpp>
telsoa014fcda012018-03-09 14:13:49 +000014
15BOOST_AUTO_TEST_SUITE(CreateWorkloadNeon)
16
17namespace
18{
19
20bool TestNeonTensorHandleInfo(armnn::INeonTensorHandle* handle, const armnn::TensorInfo& expectedInfo)
21{
22 using namespace armnn::armcomputetensorutils;
23
24 const arm_compute::ITensorInfo* handleInfo = handle->GetTensor().info();
25 const arm_compute::TensorInfo expectedAclInfo = BuildArmComputeTensorInfo(expectedInfo);
26
27 if (handleInfo->data_type() != expectedAclInfo.data_type())
28 {
29 return false;
30 }
31
32 if (handleInfo->num_dimensions() != expectedAclInfo.num_dimensions())
33 {
34 return false;
35 }
36
37 if (handleInfo->quantization_info() != expectedAclInfo.quantization_info())
38 {
39 return false;
40 }
41
42 for (std::size_t d = 0; d < expectedAclInfo.num_dimensions(); ++d)
43 {
44 if (handleInfo->dimension(d) != expectedAclInfo.dimension(d))
45 {
46 return false;
47 }
48 }
49
50 return true;
51}
52
53} // namespace
54
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010055template <typename armnn::DataType DataType>
telsoa01c577f2c2018-08-31 09:22:23 +010056static void NeonCreateActivationWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +000057{
58 Graph graph;
59 NeonWorkloadFactory factory;
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010060 auto workload = CreateActivationWorkloadTest<NeonActivationWorkload, DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +000061
telsoa01c577f2c2018-08-31 09:22:23 +010062 // Checks that inputs/outputs are as we expect them (see definition of CreateActivationWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +000063 ActivationQueueDescriptor queueDescriptor = workload->GetData();
64 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
65 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +010066 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({1, 1}, DataType)));
67 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({1, 1}, DataType)));
telsoa014fcda012018-03-09 14:13:49 +000068}
69
telsoa01c577f2c2018-08-31 09:22:23 +010070#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
71BOOST_AUTO_TEST_CASE(CreateActivationFloat16Workload)
72{
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010073 NeonCreateActivationWorkloadTest<DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +010074}
75#endif
76
arovir019e53a352018-08-31 15:26:35 +010077BOOST_AUTO_TEST_CASE(CreateActivationFloatWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +010078{
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +010079 NeonCreateActivationWorkloadTest<DataType::Float32>();
telsoa01c577f2c2018-08-31 09:22:23 +010080}
81
David Beckbc392452018-09-10 14:47:28 +010082template <typename WorkloadType,
83 typename DescriptorType,
84 typename LayerType,
85 armnn::DataType DataType>
86static void NeonCreateArithmethicWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +000087{
David Beckbc392452018-09-10 14:47:28 +010088 Graph graph;
telsoa014fcda012018-03-09 14:13:49 +000089 NeonWorkloadFactory factory;
David Beckbc392452018-09-10 14:47:28 +010090 auto workload = CreateArithmeticWorkloadTest<WorkloadType, DescriptorType, LayerType, DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +000091
David Beckbc392452018-09-10 14:47:28 +010092 DescriptorType queueDescriptor = workload->GetData();
telsoa014fcda012018-03-09 14:13:49 +000093 auto inputHandle1 = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
94 auto inputHandle2 = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[1]);
95 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +010096 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle1, TensorInfo({2, 3}, DataType)));
97 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle2, TensorInfo({2, 3}, DataType)));
98 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({2, 3}, DataType)));
telsoa014fcda012018-03-09 14:13:49 +000099}
100
telsoa01c577f2c2018-08-31 09:22:23 +0100101#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
102BOOST_AUTO_TEST_CASE(CreateAdditionFloat16Workload)
103{
David Beckbc392452018-09-10 14:47:28 +0100104 NeonCreateArithmethicWorkloadTest<NeonAdditionFloatWorkload,
105 AdditionQueueDescriptor,
106 AdditionLayer,
107 DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100108}
109#endif
110
arovir019e53a352018-08-31 15:26:35 +0100111BOOST_AUTO_TEST_CASE(CreateAdditionFloatWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100112{
David Beckbc392452018-09-10 14:47:28 +0100113 NeonCreateArithmethicWorkloadTest<NeonAdditionFloatWorkload,
114 AdditionQueueDescriptor,
115 AdditionLayer,
116 DataType::Float32>();
117}
118
119#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
120BOOST_AUTO_TEST_CASE(CreateSubtractionFloat16Workload)
121{
122 NeonCreateArithmethicWorkloadTest<NeonSubtractionFloatWorkload,
123 SubtractionQueueDescriptor,
124 SubtractionLayer,
125 DataType::Float16>();
126}
127#endif
128
129BOOST_AUTO_TEST_CASE(CreateSubtractionFloatWorkload)
130{
131 NeonCreateArithmethicWorkloadTest<NeonSubtractionFloatWorkload,
132 SubtractionQueueDescriptor,
133 SubtractionLayer,
134 DataType::Float32>();
135}
136
137#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
138BOOST_AUTO_TEST_CASE(CreateMultiplicationFloat16Workload)
139{
140 NeonCreateArithmethicWorkloadTest<NeonMultiplicationFloatWorkload,
141 MultiplicationQueueDescriptor,
142 MultiplicationLayer,
143 DataType::Float16>();
144}
145#endif
146
147BOOST_AUTO_TEST_CASE(CreateMultiplicationFloatWorkload)
148{
149 NeonCreateArithmethicWorkloadTest<NeonMultiplicationFloatWorkload,
150 MultiplicationQueueDescriptor,
151 MultiplicationLayer,
152 DataType::Float32>();
telsoa01c577f2c2018-08-31 09:22:23 +0100153}
154
155template <typename BatchNormalizationWorkloadType, typename armnn::DataType DataType>
156static void NeonCreateBatchNormalizationWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +0000157{
158 Graph graph;
159 NeonWorkloadFactory factory;
telsoa01c577f2c2018-08-31 09:22:23 +0100160 auto workload = CreateBatchNormalizationWorkloadTest<BatchNormalizationWorkloadType, DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000161
telsoa01c577f2c2018-08-31 09:22:23 +0100162 // Checks that outputs and inputs are as we expect them (see definition of CreateBatchNormalizationWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000163 BatchNormalizationQueueDescriptor queueDescriptor = workload->GetData();
164 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
165 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +0100166 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({2, 3, 1, 1}, DataType)));
167 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({2, 3, 1, 1}, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000168}
169
telsoa01c577f2c2018-08-31 09:22:23 +0100170#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
171BOOST_AUTO_TEST_CASE(CreateBatchNormalizationFloat16Workload)
172{
arovir019e53a352018-08-31 15:26:35 +0100173 NeonCreateBatchNormalizationWorkloadTest<NeonBatchNormalizationFloatWorkload, DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100174}
175#endif
176
arovir019e53a352018-08-31 15:26:35 +0100177BOOST_AUTO_TEST_CASE(CreateBatchNormalizationFloatWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100178{
arovir019e53a352018-08-31 15:26:35 +0100179 NeonCreateBatchNormalizationWorkloadTest<NeonBatchNormalizationFloatWorkload, DataType::Float32>();
telsoa01c577f2c2018-08-31 09:22:23 +0100180}
181
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100182template <typename armnn::DataType DataType>
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100183static void NeonCreateConvolution2dWorkloadTest(DataLayout dataLayout = DataLayout::NCHW)
telsoa014fcda012018-03-09 14:13:49 +0000184{
185 Graph graph;
186 NeonWorkloadFactory factory;
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100187 auto workload = CreateConvolution2dWorkloadTest<NeonConvolution2dWorkload,
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100188 DataType>(factory, graph, dataLayout);
189
190 TensorShape inputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{2, 3, 8, 16} : TensorShape{2, 8, 16, 3};
191 TensorShape outputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{2, 2, 2, 10} : TensorShape{2, 2, 10, 2};
telsoa014fcda012018-03-09 14:13:49 +0000192
telsoa01c577f2c2018-08-31 09:22:23 +0100193 // Checks that outputs and inputs are as we expect them (see definition of CreateConvolution2dWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000194 Convolution2dQueueDescriptor queueDescriptor = workload->GetData();
195 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
196 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100197 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo(inputShape, DataType)));
198 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo(outputShape, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000199}
200
telsoa01c577f2c2018-08-31 09:22:23 +0100201#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100202BOOST_AUTO_TEST_CASE(CreateConvolution2dFloat16NchwWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100203{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100204 NeonCreateConvolution2dWorkloadTest<DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100205}
telsoa01c577f2c2018-08-31 09:22:23 +0100206
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100207BOOST_AUTO_TEST_CASE(CreateConvolution2dFloat16NhwcWorkload)
208{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100209 NeonCreateConvolution2dWorkloadTest<DataType::Float16>(DataLayout::NHWC);
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100210}
211
212#endif
213BOOST_AUTO_TEST_CASE(CreateConvolution2dFloatNchwWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100214{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100215 NeonCreateConvolution2dWorkloadTest<DataType::Float32>();
telsoa01c577f2c2018-08-31 09:22:23 +0100216}
217
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100218BOOST_AUTO_TEST_CASE(CreateConvolution2dFloatNhwcWorkload)
219{
Nattapat Chaimanowong974b65f2018-10-15 15:07:34 +0100220 NeonCreateConvolution2dWorkloadTest<DataType::Float32>(DataLayout::NHWC);
Francis Murtagh0d9d4192018-10-09 16:22:33 +0100221}
222
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100223template <typename armnn::DataType DataType>
Nikhil Rajcec6b652018-10-12 13:51:57 +0100224static void NeonCreateDepthWiseConvolutionWorkloadTest(DataLayout dataLayout)
225{
226 Graph graph;
227 NeonWorkloadFactory factory;
228
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100229 auto workload = CreateDepthwiseConvolution2dWorkloadTest<NeonDepthwiseConvolutionWorkload,
Nikhil Rajcec6b652018-10-12 13:51:57 +0100230 DataType>(factory, graph, dataLayout);
231
232 // Checks that inputs/outputs are as we expect them (see definition of CreateNormalizationWorkloadTest).
233 DepthwiseConvolution2dQueueDescriptor queueDescriptor = workload->GetData();
234 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
235 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
236
237 std::initializer_list<unsigned int> inputShape = (dataLayout == DataLayout::NCHW)
238 ? std::initializer_list<unsigned int>({ 2, 2, 5, 5 })
239 : std::initializer_list<unsigned int>({ 2, 5, 5, 2 });
240 std::initializer_list<unsigned int> outputShape = (dataLayout == DataLayout::NCHW)
241 ? std::initializer_list<unsigned int>({ 2, 2, 5, 5 })
242 : std::initializer_list<unsigned int>({ 2, 5, 5, 2 });
243
244 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo(inputShape, DataType)));
245 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo(outputShape, DataType)));
246}
247
248BOOST_AUTO_TEST_CASE(CreateDepthWiseConvolution2dFloat32NhwcWorkload)
249{
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100250 NeonCreateDepthWiseConvolutionWorkloadTest<DataType::Float32>(DataLayout::NHWC);
Nikhil Rajcec6b652018-10-12 13:51:57 +0100251}
252
253#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
254BOOST_AUTO_TEST_CASE(CreateDepthWiseConvolution2dFloat16NhwcWorkload)
255{
Nattapat Chaimanowong77140882018-10-17 11:12:19 +0100256 NeonCreateDepthWiseConvolutionWorkloadTest<DataType::Float16>(DataLayout::NHWC);
Nikhil Rajcec6b652018-10-12 13:51:57 +0100257}
258#endif
259
telsoa01c577f2c2018-08-31 09:22:23 +0100260template <typename FullyConnectedWorkloadType, typename armnn::DataType DataType>
261static void NeonCreateFullyConnectedWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +0000262{
263 Graph graph;
264 NeonWorkloadFactory factory;
telsoa01c577f2c2018-08-31 09:22:23 +0100265 auto workload = CreateFullyConnectedWorkloadTest<FullyConnectedWorkloadType,
266 DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000267
telsoa01c577f2c2018-08-31 09:22:23 +0100268 // Checks that outputs and inputs are as we expect them (see definition of CreateFullyConnectedWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000269 FullyConnectedQueueDescriptor queueDescriptor = workload->GetData();
270 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
271 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +0100272 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({3, 1, 4, 5}, DataType)));
273 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({3, 7}, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000274}
275
telsoa01c577f2c2018-08-31 09:22:23 +0100276#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
277BOOST_AUTO_TEST_CASE(CreateFullyConnectedFloat16Workload)
278{
kevmay01e448be32018-09-26 10:21:55 +0100279 NeonCreateFullyConnectedWorkloadTest<NeonFullyConnectedWorkload, DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100280}
281#endif
282
arovir019e53a352018-08-31 15:26:35 +0100283BOOST_AUTO_TEST_CASE(CreateFullyConnectedFloatWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100284{
kevmay01e448be32018-09-26 10:21:55 +0100285 NeonCreateFullyConnectedWorkloadTest<NeonFullyConnectedWorkload, DataType::Float32>();
telsoa01c577f2c2018-08-31 09:22:23 +0100286}
287
telsoa01c577f2c2018-08-31 09:22:23 +0100288template <typename NormalizationWorkloadType, typename armnn::DataType DataType>
narpra0155a97bc2018-10-02 14:35:53 +0100289static void NeonCreateNormalizationWorkloadTest(DataLayout dataLayout)
telsoa014fcda012018-03-09 14:13:49 +0000290{
narpra0155a97bc2018-10-02 14:35:53 +0100291 Graph graph;
telsoa014fcda012018-03-09 14:13:49 +0000292 NeonWorkloadFactory factory;
narpra0155a97bc2018-10-02 14:35:53 +0100293 auto workload = CreateNormalizationWorkloadTest<NormalizationWorkloadType, DataType>(factory, graph, dataLayout);
telsoa014fcda012018-03-09 14:13:49 +0000294
telsoa01c577f2c2018-08-31 09:22:23 +0100295 // Checks that outputs and inputs are as we expect them (see definition of CreateNormalizationWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000296 NormalizationQueueDescriptor queueDescriptor = workload->GetData();
297 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
298 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
Matteo Martincigha160b242018-10-18 10:33:23 +0100299
300 TensorShape inputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{3, 5, 5, 1} : TensorShape{3, 1, 5, 5};
301 TensorShape outputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{3, 5, 5, 1} : TensorShape{3, 1, 5, 5};
302
303 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo(inputShape, DataType)));
304 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo(outputShape, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000305}
306
telsoa01c577f2c2018-08-31 09:22:23 +0100307#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
narpra0155a97bc2018-10-02 14:35:53 +0100308BOOST_AUTO_TEST_CASE(CreateNormalizationFloat16NchwWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100309{
narpra0155a97bc2018-10-02 14:35:53 +0100310 NeonCreateNormalizationWorkloadTest<NeonNormalizationFloatWorkload, DataType::Float16>(DataLayout::NCHW);
311}
312
313BOOST_AUTO_TEST_CASE(CreateNormalizationFloat16NhwcWorkload)
314{
315 NeonCreateNormalizationWorkloadTest<NeonNormalizationFloatWorkload, DataType::Float16>(DataLayout::NHWC);
telsoa01c577f2c2018-08-31 09:22:23 +0100316}
317#endif
318
narpra0155a97bc2018-10-02 14:35:53 +0100319BOOST_AUTO_TEST_CASE(CreateNormalizationFloatNchwWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100320{
narpra0155a97bc2018-10-02 14:35:53 +0100321 NeonCreateNormalizationWorkloadTest<NeonNormalizationFloatWorkload, DataType::Float32>(DataLayout::NCHW);
telsoa01c577f2c2018-08-31 09:22:23 +0100322}
323
narpra0155a97bc2018-10-02 14:35:53 +0100324BOOST_AUTO_TEST_CASE(CreateNormalizationFloatNhwcWorkload)
325{
326 NeonCreateNormalizationWorkloadTest<NeonNormalizationFloatWorkload, DataType::Float32>(DataLayout::NHWC);
327}
328
329
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100330template <typename armnn::DataType DataType>
Nina Drozdb48e6862018-10-09 12:09:56 +0100331static void NeonCreatePooling2dWorkloadTest(DataLayout dataLayout = DataLayout::NCHW)
telsoa014fcda012018-03-09 14:13:49 +0000332{
333 Graph graph;
334 NeonWorkloadFactory factory;
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100335 auto workload = CreatePooling2dWorkloadTest<NeonPooling2dWorkload, DataType>
Nina Drozdb48e6862018-10-09 12:09:56 +0100336 (factory, graph, dataLayout);
337
338 TensorShape inputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{3, 2, 5, 5} : TensorShape{3, 5, 5, 2};
339 TensorShape outputShape = (dataLayout == DataLayout::NCHW) ? TensorShape{3, 2, 2, 4} : TensorShape{3, 2, 4, 2};
telsoa014fcda012018-03-09 14:13:49 +0000340
telsoa01c577f2c2018-08-31 09:22:23 +0100341 // Checks that outputs and inputs are as we expect them (see definition of CreatePooling2dWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000342 Pooling2dQueueDescriptor queueDescriptor = workload->GetData();
343 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
344 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
Nina Drozdb48e6862018-10-09 12:09:56 +0100345 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo(inputShape, DataType)));
346 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo(outputShape, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000347}
348
telsoa01c577f2c2018-08-31 09:22:23 +0100349#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
350BOOST_AUTO_TEST_CASE(CreatePooling2dFloat16Workload)
351{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100352 NeonCreatePooling2dWorkloadTest<DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100353}
354#endif
355
Nina Drozdb48e6862018-10-09 12:09:56 +0100356BOOST_AUTO_TEST_CASE(CreatePooling2dFloatNchwWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100357{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100358 NeonCreatePooling2dWorkloadTest<DataType::Float32>(DataLayout::NCHW);
telsoa01c577f2c2018-08-31 09:22:23 +0100359}
360
Nina Drozdb48e6862018-10-09 12:09:56 +0100361BOOST_AUTO_TEST_CASE(CreatePooling2dFloatNhwcWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100362{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100363 NeonCreatePooling2dWorkloadTest<DataType::Float32>(DataLayout::NHWC);
Nina Drozdb48e6862018-10-09 12:09:56 +0100364}
365
366BOOST_AUTO_TEST_CASE(CreatePooling2dUint8NchwWorkload)
367{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100368 NeonCreatePooling2dWorkloadTest<DataType::QuantisedAsymm8>(DataLayout::NCHW);
Nina Drozdb48e6862018-10-09 12:09:56 +0100369}
370
371BOOST_AUTO_TEST_CASE(CreatePooling2dUint8NhwcWorkload)
372{
Nattapat Chaimanowong5d2e7002018-10-12 16:03:56 +0100373 NeonCreatePooling2dWorkloadTest<DataType::QuantisedAsymm8>(DataLayout::NHWC);
telsoa01c577f2c2018-08-31 09:22:23 +0100374}
375
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100376template <typename armnn::DataType DataType>
telsoa01c577f2c2018-08-31 09:22:23 +0100377static void NeonCreateReshapeWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +0000378{
379 Graph graph;
380 NeonWorkloadFactory factory;
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100381 auto workload = CreateReshapeWorkloadTest<NeonReshapeWorkload, DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000382
telsoa01c577f2c2018-08-31 09:22:23 +0100383 // Checks that outputs and inputs are as we expect them (see definition of CreateReshapeWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000384 ReshapeQueueDescriptor queueDescriptor = workload->GetData();
385 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
386 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +0100387 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({4, 1}, DataType)));
388 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({1, 4}, DataType)));
telsoa014fcda012018-03-09 14:13:49 +0000389}
390
telsoa01c577f2c2018-08-31 09:22:23 +0100391#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
392BOOST_AUTO_TEST_CASE(CreateReshapeFloat16Workload)
393{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100394 NeonCreateReshapeWorkloadTest<DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100395}
396#endif
397
arovir019e53a352018-08-31 15:26:35 +0100398BOOST_AUTO_TEST_CASE(CreateReshapeFloatWorkload)
telsoa014fcda012018-03-09 14:13:49 +0000399{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100400 NeonCreateReshapeWorkloadTest<DataType::Float32>();
telsoa014fcda012018-03-09 14:13:49 +0000401}
402
403BOOST_AUTO_TEST_CASE(CreateReshapeUint8Workload)
404{
Nattapat Chaimanowongcce11fc2018-10-12 16:30:56 +0100405 NeonCreateReshapeWorkloadTest<DataType::QuantisedAsymm8>();
telsoa014fcda012018-03-09 14:13:49 +0000406}
407
telsoa01c577f2c2018-08-31 09:22:23 +0100408template <typename SoftmaxWorkloadType, typename armnn::DataType DataType>
409static void NeonCreateSoftmaxWorkloadTest()
telsoa014fcda012018-03-09 14:13:49 +0000410{
411 Graph graph;
412 NeonWorkloadFactory factory;
telsoa01c577f2c2018-08-31 09:22:23 +0100413 auto workload = CreateSoftmaxWorkloadTest<SoftmaxWorkloadType, DataType>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000414
telsoa01c577f2c2018-08-31 09:22:23 +0100415 // Checks that outputs and inputs are as we expect them (see definition of CreateSoftmaxWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000416 SoftmaxQueueDescriptor queueDescriptor = workload->GetData();
417 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
418 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
telsoa01c577f2c2018-08-31 09:22:23 +0100419 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({4, 1}, DataType)));
420 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo({4, 1}, DataType)));
421}
422
423#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
424BOOST_AUTO_TEST_CASE(CreateSoftmaxFloat16Workload)
425{
arovir019e53a352018-08-31 15:26:35 +0100426 NeonCreateSoftmaxWorkloadTest<NeonSoftmaxFloatWorkload, DataType::Float16>();
telsoa01c577f2c2018-08-31 09:22:23 +0100427}
428#endif
429
arovir019e53a352018-08-31 15:26:35 +0100430BOOST_AUTO_TEST_CASE(CreateSoftmaxFloatWorkload)
telsoa01c577f2c2018-08-31 09:22:23 +0100431{
arovir019e53a352018-08-31 15:26:35 +0100432 NeonCreateSoftmaxWorkloadTest<NeonSoftmaxFloatWorkload, DataType::Float32>();
telsoa014fcda012018-03-09 14:13:49 +0000433}
434
435BOOST_AUTO_TEST_CASE(CreateSplitterWorkload)
436{
437 Graph graph;
438 NeonWorkloadFactory factory;
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100439 auto workload = CreateSplitterWorkloadTest<NeonSplitterWorkload, DataType::Float32>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000440
telsoa01c577f2c2018-08-31 09:22:23 +0100441 // Checks that outputs are as we expect them (see definition of CreateSplitterWorkloadTest).
telsoa014fcda012018-03-09 14:13:49 +0000442 SplitterQueueDescriptor queueDescriptor = workload->GetData();
443 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
surmeh013537c2c2018-05-18 16:31:43 +0100444 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo({5, 7, 7}, DataType::Float32)));
445
telsoa014fcda012018-03-09 14:13:49 +0000446 auto outputHandle0 = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
surmeh013537c2c2018-05-18 16:31:43 +0100447 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle0, TensorInfo({1, 7, 7}, DataType::Float32)));
448
telsoa014fcda012018-03-09 14:13:49 +0000449 auto outputHandle1 = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[1]);
surmeh013537c2c2018-05-18 16:31:43 +0100450 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle1, TensorInfo({2, 7, 7}, DataType::Float32)));
451
telsoa014fcda012018-03-09 14:13:49 +0000452 auto outputHandle2 = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[2]);
surmeh013537c2c2018-05-18 16:31:43 +0100453 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle2, TensorInfo({2, 7, 7}, DataType::Float32)));
telsoa014fcda012018-03-09 14:13:49 +0000454}
455
456BOOST_AUTO_TEST_CASE(CreateSplitterMerger)
457{
telsoa01c577f2c2018-08-31 09:22:23 +0100458 // Tests that it is possible to decide which output of the splitter layer
459 // should be lined to which input of the merger layer.
460 // We tested that is is possible to specify 0th output
461 // of the splitter to be the 1st input to the merger, and the 1st output of the splitter to be 0th input
telsoa014fcda012018-03-09 14:13:49 +0000462 // of the merger.
463
464 Graph graph;
465 NeonWorkloadFactory factory;
466
467 auto workloads =
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100468 CreateSplitterMergerWorkloadTest<NeonSplitterWorkload, NeonMergerWorkload,
telsoa01c577f2c2018-08-31 09:22:23 +0100469 DataType::Float32>(factory, graph);
telsoa014fcda012018-03-09 14:13:49 +0000470
471 auto wlSplitter = std::move(workloads.first);
472 auto wlMerger = std::move(workloads.second);
473
telsoa01c577f2c2018-08-31 09:22:23 +0100474 //Checks that the index of inputs/outputs matches what we declared on InputDescriptor construction.
telsoa014fcda012018-03-09 14:13:49 +0000475 armnn::INeonTensorHandle* sOut0 = dynamic_cast<armnn::INeonTensorHandle*>(wlSplitter->GetData().m_Outputs[0]);
476 armnn::INeonTensorHandle* sOut1 = dynamic_cast<armnn::INeonTensorHandle*>(wlSplitter->GetData().m_Outputs[1]);
477 armnn::INeonTensorHandle* mIn0 = dynamic_cast<armnn::INeonTensorHandle*>(wlMerger->GetData().m_Inputs[0]);
478 armnn::INeonTensorHandle* mIn1 = dynamic_cast<armnn::INeonTensorHandle*>(wlMerger->GetData().m_Inputs[1]);
479
480 BOOST_TEST(sOut0);
481 BOOST_TEST(sOut1);
482 BOOST_TEST(mIn0);
483 BOOST_TEST(mIn1);
484
485 bool validDataPointers = (sOut0 == mIn1) && (sOut1 == mIn0);
486
487 BOOST_TEST(validDataPointers);
488}
489
490BOOST_AUTO_TEST_CASE(CreateSingleOutputMultipleInputs)
491{
telsoa01c577f2c2018-08-31 09:22:23 +0100492 // Tests that it is possible to assign multiple (two) different layers to each of the outputs of a splitter layer.
493 // We created a splitter with two outputs. That each of those outputs is used by two different activation layers
telsoa014fcda012018-03-09 14:13:49 +0000494
495 Graph graph;
496 NeonWorkloadFactory factory;
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100497 std::unique_ptr<NeonSplitterWorkload> wlSplitter;
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +0100498 std::unique_ptr<NeonActivationWorkload> wlActiv0_0;
499 std::unique_ptr<NeonActivationWorkload> wlActiv0_1;
500 std::unique_ptr<NeonActivationWorkload> wlActiv1_0;
501 std::unique_ptr<NeonActivationWorkload> wlActiv1_1;
telsoa014fcda012018-03-09 14:13:49 +0000502
Nattapat Chaimanowong14766d72018-10-12 15:09:53 +0100503 CreateSplitterMultipleInputsOneOutputWorkloadTest<NeonSplitterWorkload,
Nattapat Chaimanowongd4b70592018-10-12 11:21:49 +0100504 NeonActivationWorkload, DataType::Float32>(factory, graph, wlSplitter, wlActiv0_0, wlActiv0_1,
505 wlActiv1_0, wlActiv1_1);
telsoa014fcda012018-03-09 14:13:49 +0000506
507 armnn::INeonTensorHandle* sOut0 = dynamic_cast<armnn::INeonTensorHandle*>(wlSplitter->GetData().m_Outputs[0]);
508 armnn::INeonTensorHandle* sOut1 = dynamic_cast<armnn::INeonTensorHandle*>(wlSplitter->GetData().m_Outputs[1]);
509 armnn::INeonTensorHandle* activ0_0Im = dynamic_cast<armnn::INeonTensorHandle*>(wlActiv0_0->GetData().m_Inputs[0]);
510 armnn::INeonTensorHandle* activ0_1Im = dynamic_cast<armnn::INeonTensorHandle*>(wlActiv0_1->GetData().m_Inputs[0]);
511 armnn::INeonTensorHandle* activ1_0Im = dynamic_cast<armnn::INeonTensorHandle*>(wlActiv1_0->GetData().m_Inputs[0]);
512 armnn::INeonTensorHandle* activ1_1Im = dynamic_cast<armnn::INeonTensorHandle*>(wlActiv1_1->GetData().m_Inputs[0]);
513
514
515 BOOST_TEST(sOut0);
516 BOOST_TEST(sOut1);
517 BOOST_TEST(activ0_0Im);
518 BOOST_TEST(activ0_1Im);
519 BOOST_TEST(activ1_0Im);
520 BOOST_TEST(activ1_1Im);
521
522 bool validDataPointers = (sOut0 == activ0_0Im) && (sOut0 == activ0_1Im) &&
523 (sOut1 == activ1_0Im) && (sOut1 == activ1_1Im);
524
525 BOOST_TEST(validDataPointers);
526}
527
528BOOST_AUTO_TEST_CASE(CreateMemCopyWorkloadsNeon)
529{
530 NeonWorkloadFactory factory;
telsoa01c577f2c2018-08-31 09:22:23 +0100531 CreateMemCopyWorkloads<INeonTensorHandle>(factory);
telsoa014fcda012018-03-09 14:13:49 +0000532}
533
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100534template <typename L2NormalizationWorkloadType, typename armnn::DataType DataType>
535static void NeonCreateL2NormalizationWorkloadTest(DataLayout dataLayout)
536{
Matteo Martincigh2400b6d2018-10-09 18:19:20 +0100537 Graph graph;
538 NeonWorkloadFactory factory;
539 auto workload =
540 CreateL2NormalizationWorkloadTest<L2NormalizationWorkloadType, DataType>(factory, graph, dataLayout);
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100541
542 // Checks that inputs/outputs are as we expect them (see definition of CreateNormalizationWorkloadTest).
543 L2NormalizationQueueDescriptor queueDescriptor = workload->GetData();
544 auto inputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Inputs[0]);
545 auto outputHandle = boost::polymorphic_downcast<INeonTensorHandle*>(queueDescriptor.m_Outputs[0]);
Matteo Martincigh2400b6d2018-10-09 18:19:20 +0100546
547 TensorShape inputShape = (dataLayout == DataLayout::NCHW) ?
548 TensorShape{ 5, 20, 50, 67 } : TensorShape{ 5, 50, 67, 20 };
549 TensorShape outputShape = (dataLayout == DataLayout::NCHW) ?
550 TensorShape{ 5, 20, 50, 67 } : TensorShape{ 5, 50, 67, 20 };
551
552 BOOST_TEST(TestNeonTensorHandleInfo(inputHandle, TensorInfo(inputShape, DataType)));
553 BOOST_TEST(TestNeonTensorHandleInfo(outputHandle, TensorInfo(outputShape, DataType)));
Matteo Martincighbcd3c852018-09-28 14:14:12 +0100554}
555
556#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
557BOOST_AUTO_TEST_CASE(CreateL2NormalizationFloat16NchwWorkload)
558{
559 NeonCreateL2NormalizationWorkloadTest<NeonL2NormalizationFloatWorkload, DataType::Float16>(DataLayout::NCHW);
560}
561
562BOOST_AUTO_TEST_CASE(CreateL2NormalizationFloat16NhwcWorkload)
563{
564 NeonCreateL2NormalizationWorkloadTest<NeonL2NormalizationFloatWorkload, DataType::Float16>(DataLayout::NHWC);
565}
566#endif
567
568BOOST_AUTO_TEST_CASE(CreateL2NormalizationNchwWorkload)
569{
570 NeonCreateL2NormalizationWorkloadTest<NeonL2NormalizationFloatWorkload, DataType::Float32>(DataLayout::NCHW);
571}
572
573BOOST_AUTO_TEST_CASE(CreateL2NormalizationNhwcWorkload)
574{
575 NeonCreateL2NormalizationWorkloadTest<NeonL2NormalizationFloatWorkload, DataType::Float32>(DataLayout::NHWC);
576}
577
telsoa014fcda012018-03-09 14:13:49 +0000578BOOST_AUTO_TEST_SUITE_END()