blob: 2c94cb51845d79bcbcbd9b46295b1f69db30cabc [file] [log] [blame]
//
// Copyright © 2020 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "NeonGatherWorkload.hpp"
7#include "NeonWorkloadUtils.hpp"
8#include <armnn/utility/PolymorphicDowncast.hpp>
9#include <aclCommon/ArmComputeUtils.hpp>
10
11namespace armnn
12{
13arm_compute::Status NeonGatherWorkloadValidate(const TensorInfo& input,
14 const TensorInfo& indices,
Teresa Charlin52664732020-06-29 16:27:03 +010015 const TensorInfo& output,
16 const GatherDescriptor& descriptor)
Teresa Charlinf540eb82020-04-10 19:24:55 +010017{
18 const arm_compute::TensorInfo aclInput = BuildArmComputeTensorInfo(input);
19 const arm_compute::TensorInfo aclIndices = BuildArmComputeTensorInfo(indices);
20 const arm_compute::TensorInfo aclOutput = BuildArmComputeTensorInfo(output);
21
Teresa Charlin52664732020-06-29 16:27:03 +010022 int aclAxis = ComputeAclAxis(descriptor.m_Axis, input);
Teresa Charlinf540eb82020-04-10 19:24:55 +010023
24 return arm_compute::NEGather::validate(&aclInput, &aclIndices, &aclOutput, aclAxis);
25}
26
27NeonGatherWorkload::NeonGatherWorkload(const GatherQueueDescriptor& descriptor,
28 const WorkloadInfo& info)
29 : BaseWorkload<GatherQueueDescriptor>(descriptor, info)
30{
31 m_Data.ValidateInputsOutputs("NeonGatherWorkload", 1, 1);
32
33 arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
34 arm_compute::ITensor& indices = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
35 arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
36
Teresa Charlin52664732020-06-29 16:27:03 +010037 int aclAxis = ComputeAclAxis(descriptor.m_Parameters.m_Axis, info.m_InputTensorInfos[0]);
Teresa Charlinf540eb82020-04-10 19:24:55 +010038
39 m_Layer.configure(&input, &indices, &output, aclAxis);
40}
41
42void NeonGatherWorkload::Execute() const
43{
44 ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonGatherWorkload_Execute");
45 m_Layer.run();
46}
47} //namespace armnn