blob: adc34e91c400d4e8c6ca27432f80cd13ddc55e5e [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
arovir019e53a352018-08-31 15:26:35 +01006#include "NeonAdditionFloatWorkload.hpp"
telsoa01c577f2c2018-08-31 09:22:23 +01007#include "backends/ArmComputeTensorUtils.hpp"
telsoa014fcda012018-03-09 14:13:49 +00008#include "backends/CpuTensorHandle.hpp"
9
10namespace armnn
11{
12
telsoa01c577f2c2018-08-31 09:22:23 +010013arm_compute::Status NeonAdditionWorkloadValidate(const TensorInfo& input0,
14 const TensorInfo& input1,
15 const TensorInfo& output)
16{
17 const arm_compute::TensorInfo aclInput0 = armcomputetensorutils::BuildArmComputeTensorInfo(input0);
18 const arm_compute::TensorInfo aclInput1 = armcomputetensorutils::BuildArmComputeTensorInfo(input1);
19 const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
20
21 return arm_compute::NEArithmeticAddition::validate(&aclInput0,
22 &aclInput1,
23 &aclOutput,
24 arm_compute::ConvertPolicy::SATURATE);
25}
26
27
arovir019e53a352018-08-31 15:26:35 +010028NeonAdditionFloatWorkload::NeonAdditionFloatWorkload(const AdditionQueueDescriptor& descriptor,
29 const WorkloadInfo& info)
telsoa01c577f2c2018-08-31 09:22:23 +010030 : FloatWorkload<AdditionQueueDescriptor>(descriptor, info)
telsoa014fcda012018-03-09 14:13:49 +000031{
arovir019e53a352018-08-31 15:26:35 +010032 m_Data.ValidateInputsOutputs("NeonAdditionFloatWorkload", 2, 1);
telsoa014fcda012018-03-09 14:13:49 +000033
34 arm_compute::ITensor& input1 = boost::polymorphic_downcast<INeonTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
35 arm_compute::ITensor& input2 = boost::polymorphic_downcast<INeonTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
36 arm_compute::ITensor& output = boost::polymorphic_downcast<INeonTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
37
38 m_AddLayer.configure(&input1, &input2, &output, arm_compute::ConvertPolicy::SATURATE);
39}
40
arovir019e53a352018-08-31 15:26:35 +010041void NeonAdditionFloatWorkload::Execute() const
telsoa014fcda012018-03-09 14:13:49 +000042{
arovir019e53a352018-08-31 15:26:35 +010043 ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonAdditionFloatWorkload_Execute");
telsoa014fcda012018-03-09 14:13:49 +000044 m_AddLayer.run();
45}
46
47} //namespace armnn
48