//
// Copyright © 2019-2023 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
#include "NeonSplitterWorkload.hpp"

#include <arm_compute/runtime/NEON/functions/NESplit.h>

#include <aclCommon/ArmComputeTensorUtils.hpp>
#include <aclCommon/ArmComputeUtils.hpp>
#include <armnn/utility/PolymorphicDowncast.hpp>
#include <armnn/backends/TensorHandle.hpp>
#include <neon/NeonTensorHandle.hpp>

#include "NeonWorkloadUtils.hpp"

#include <memory>
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010017
18namespace armnn
19{
20
21using namespace armcomputetensorutils;
22
namespace
{

/// Mirrors an axis index within a tensor of @p numDimensions dimensions:
/// axis 0 maps to (numDimensions - 1) and axis (numDimensions - 1) maps to 0.
/// The result is the axis value this file hands to arm_compute::NESplit.
///
/// @param numDimensions Number of dimensions of the tensor being split.
/// @param splitAxis     Axis index to mirror.
/// @return numDimensions - splitAxis - 1, computed in unsigned arithmetic
///         (so it wraps around if splitAxis >= numDimensions).
unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int splitAxis)
{
    const unsigned int lastAxis = numDimensions - 1;
    return lastAxis - splitAxis;
}

} // anonymous namespace
31
32arm_compute::Status NeonSplitterWorkloadValidate(const TensorInfo& input,
33 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
34 unsigned int splitAxis)
35{
36 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
37
38 size_t numOutputs = outputs.size();
39
40 std::vector<arm_compute::TensorInfo> aclOutputs;
41 aclOutputs.reserve(numOutputs);
42
43 std::vector<arm_compute::ITensorInfo*> aclOutputPtr;
44 aclOutputPtr.reserve(numOutputs);
45
46 for (size_t i = 0u; i < outputs.size(); ++i)
47 {
48 aclOutputs.emplace_back(BuildArmComputeTensorInfo(outputs[i]));
49 aclOutputPtr.emplace_back(&aclOutputs.back());
50 }
51
52 unsigned int aclAxis = CalcAclAxis(input.GetNumDimensions(), splitAxis);
53 return arm_compute::NESplit::validate(&aclInputInfo, aclOutputPtr, aclAxis);
54}
55
56NeonSplitterWorkload::NeonSplitterWorkload(const SplitterQueueDescriptor& descriptor, const WorkloadInfo& info)
Teresa Charlin588cbdf2022-01-19 15:55:37 +000057 : NeonBaseWorkload<SplitterQueueDescriptor>(descriptor, info)
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010058{
Keith Davis2d0679f2021-08-05 11:35:00 +010059 // Report Profiling Details
60 ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonSplitterWorkload_Construct",
61 descriptor.m_Parameters,
62 info,
63 this->GetGuid());
64
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010065 bool allOutputsAreSubtensors = true;
66
67 // Check that all outputs are sub-tensors
68 for (auto output : m_Data.m_Outputs)
69 {
70 if (output && !output->GetParent())
71 {
72 // Non sub-tensor input found so we need to execute the split function
73 allOutputsAreSubtensors = false;
74 break;
75 }
76 }
77
78 if (allOutputsAreSubtensors)
79 {
80 // Can skip configuring the split function since it's not executed
81 return;
82 }
83
Jan Eilersbb446e52020-04-02 13:56:54 +010084 arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010085
86 std::vector<arm_compute::ITensor *> aclOutputs;
87 for (auto output : m_Data.m_Outputs)
88 {
Jan Eilers3c9e0452020-04-10 13:00:44 +010089 arm_compute::ITensor& aclOutput = PolymorphicPointerDowncast<IAclTensorHandle>(output)->GetTensor();
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010090 aclOutputs.emplace_back(&aclOutput);
91 }
92
93 // Create the layer function
Matthew Bentham5e98b012020-01-24 23:11:43 +000094 std::unique_ptr<arm_compute::NESplit> layer(new arm_compute::NESplit());
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +010095
96 // Configure input and output tensors
97 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor.m_Parameters, m_Data.m_Inputs[0]->GetShape());
98 if (splitAxis.size() != 1)
99 {
100 throw InvalidArgumentException("Cannot derive split axis from SplitterDescriptor");
101 }
102
103 unsigned int aclAxis = CalcAclAxis(descriptor.m_Parameters.GetNumDimensions(), *splitAxis.begin());
Matthew Bentham5e98b012020-01-24 23:11:43 +0000104 layer->configure(&input, aclOutputs, aclAxis);
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100105
106 // Prepare
Matthew Bentham5e98b012020-01-24 23:11:43 +0000107 layer->prepare();
108 m_Layer.reset(layer.release());
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100109}
110
111void NeonSplitterWorkload::Execute() const
112{
113 if (m_Layer)
114 {
Mike Kelly7cbe7812023-07-25 17:37:33 +0100115 ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonSplitterWorkload_Execute");
Narumol Prangnawarat15eb5832019-05-20 15:31:05 +0100116 m_Layer->run();
117 }
118}
119
120} //namespace armnn
121