blob: 045fbb7595bb9a902b5823b40bb2c6c630c69e67 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "ClSplitterWorkload.hpp"
7
8#include "ClWorkloadUtils.hpp"
9
10#include <aclCommon/ArmComputeTensorUtils.hpp>
11#include <aclCommon/ArmComputeUtils.hpp>
Matthew Bentham9b3e7382020-02-05 21:39:55 +000012#include <arm_compute/runtime/CL/functions/CLSplit.h>
Jan Eilers3c9e0452020-04-10 13:00:44 +010013#include <armnn/utility/PolymorphicDowncast.hpp>
Narumol Prangnawarat74135832019-05-23 15:07:33 +010014#include <backendsCommon/CpuTensorHandle.hpp>
15#include <cl/ClTensorHandle.hpp>
16
17
18namespace armnn
19{
20
21using namespace armcomputetensorutils;
22
23namespace
24{
// Mirrors an axis index within a tensor of numDimensions dimensions, so that axis 0 maps to
// numDimensions - 1 and the last axis maps to 0.
// NOTE(review): presumably needed because ACL numbers dimensions in the opposite order to ArmNN - confirm.
// The caller must ensure splitAxis < numDimensions; otherwise the unsigned subtraction wraps around.
unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int splitAxis)
{
    const unsigned int lastAxis = numDimensions - 1;
    return lastAxis - splitAxis;
}
29
30} //namespace
31
32arm_compute::Status ClSplitterWorkloadValidate(const TensorInfo& input,
33 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
34 unsigned int splitAxis)
35{
36 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
37
38 size_t numOutputs = outputs.size();
39
40 std::vector<arm_compute::TensorInfo> aclOutputs;
41 aclOutputs.reserve(numOutputs);
42
43 std::vector<arm_compute::ITensorInfo*> aclOutputPtr;
44 aclOutputPtr.reserve(numOutputs);
45
46 for (size_t i = 0u; i < outputs.size(); ++i)
47 {
48 aclOutputs.emplace_back(BuildArmComputeTensorInfo(outputs[i]));
49 aclOutputPtr.emplace_back(&aclOutputs.back());
50 }
51
52 unsigned int aclAxis = CalcAclAxis(input.GetNumDimensions(), splitAxis);
53 return arm_compute::CLSplit::validate(&aclInputInfo, aclOutputPtr, aclAxis);
54}
55
56ClSplitterWorkload::ClSplitterWorkload(const SplitterQueueDescriptor& descriptor, const WorkloadInfo& info)
57 : BaseWorkload<SplitterQueueDescriptor>(descriptor, info)
58{
59 bool allOutputsAreSubtensors = true;
60
61 // Check that all outputs are sub-tensors
62 for (auto output : m_Data.m_Outputs)
63 {
64 if (output && !output->GetParent())
65 {
66 // Non sub-tensor input found so we need to execute the split function
67 allOutputsAreSubtensors = false;
68 break;
69 }
70 }
71
72 if (allOutputsAreSubtensors)
73 {
74 // Can skip configuring the split function since it's not executed
75 return;
76 }
77
Jan Eilers3c9e0452020-04-10 13:00:44 +010078 arm_compute::ICLTensor& input = armnn::PolymorphicPointerDowncast<IClTensorHandle>(
Narumol Prangnawarat74135832019-05-23 15:07:33 +010079 m_Data.m_Inputs[0])->GetTensor();
80
81 std::vector<arm_compute::ICLTensor *> aclOutputs;
82 for (auto output : m_Data.m_Outputs)
83 {
Jan Eilers3c9e0452020-04-10 13:00:44 +010084 arm_compute::ICLTensor& aclOutput = armnn::PolymorphicPointerDowncast<IClTensorHandle>(output)->GetTensor();
Narumol Prangnawarat74135832019-05-23 15:07:33 +010085 aclOutputs.emplace_back(&aclOutput);
86 }
87
88 // Create the layer function
Narumol Prangnawarat74135832019-05-23 15:07:33 +010089
90 // Configure input and output tensors
91 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor.m_Parameters, m_Data.m_Inputs[0]->GetShape());
92 if (splitAxis.size() != 1)
93 {
94 throw InvalidArgumentException("Cannot derive split axis from SplitterDescriptor");
95 }
96
97 unsigned int aclAxis = CalcAclAxis(descriptor.m_Parameters.GetNumDimensions(), *splitAxis.begin());
Matthew Bentham9b3e7382020-02-05 21:39:55 +000098 auto layer = std::make_unique<arm_compute::CLSplit>();
99 layer->configure(&input, aclOutputs, aclAxis);
Narumol Prangnawarat74135832019-05-23 15:07:33 +0100100
101 // Prepare
Matthew Bentham9b3e7382020-02-05 21:39:55 +0000102 layer->prepare();
103
104 m_Layer = std::move(layer);
Narumol Prangnawarat74135832019-05-23 15:07:33 +0100105}
106
107void ClSplitterWorkload::Execute() const
108{
109 if (m_Layer)
110 {
111 ARMNN_SCOPED_PROFILING_EVENT_CL("ClSplitterWorkload_Execute");
112 m_Layer->run();
113 }
114}
115
116} //namespace armnn