blob: ec0dd30275ce63df88a5abbb7730b6bc3a349a0d [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
David Beck0a710c42018-09-11 15:21:14 +01006#include "ClAdditionWorkload.hpp"
telsoa01c577f2c2018-08-31 09:22:23 +01007
David Beckac42efd2018-09-26 17:41:13 +01008#include <backends/cl/ClTensorHandle.hpp>
David Beck711fa312018-09-24 10:46:38 +01009#include <backends/CpuTensorHandle.hpp>
10#include <backends/aclCommon/ArmComputeTensorUtils.hpp>
telsoa01c577f2c2018-08-31 09:22:23 +010011
Matthew Bentham14e46692018-09-20 15:35:30 +010012#include "ClWorkloadUtils.hpp"
13
telsoa01c577f2c2018-08-31 09:22:23 +010014namespace armnn
15{
16using namespace armcomputetensorutils;
17
18static constexpr arm_compute::ConvertPolicy g_AclConvertPolicy = arm_compute::ConvertPolicy::SATURATE;
19
20template <armnn::DataType... T>
David Beck0a710c42018-09-11 15:21:14 +010021ClAdditionWorkload<T...>::ClAdditionWorkload(const AdditionQueueDescriptor& descriptor,
telsoa01c577f2c2018-08-31 09:22:23 +010022 const WorkloadInfo& info)
23 : TypedWorkload<AdditionQueueDescriptor, T...>(descriptor, info)
24{
David Beck0a710c42018-09-11 15:21:14 +010025 this->m_Data.ValidateInputsOutputs("ClAdditionWorkload", 2, 1);
telsoa01c577f2c2018-08-31 09:22:23 +010026
27 arm_compute::ICLTensor& input0 = static_cast<IClTensorHandle*>(this->m_Data.m_Inputs[0])->GetTensor();
28 arm_compute::ICLTensor& input1 = static_cast<IClTensorHandle*>(this->m_Data.m_Inputs[1])->GetTensor();
29 arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(this->m_Data.m_Outputs[0])->GetTensor();
30 m_Layer.configure(&input0, &input1, &output, g_AclConvertPolicy);
31}
32
33template <armnn::DataType... T>
David Beck0a710c42018-09-11 15:21:14 +010034void ClAdditionWorkload<T...>::Execute() const
telsoa01c577f2c2018-08-31 09:22:23 +010035{
David Beck0a710c42018-09-11 15:21:14 +010036 ARMNN_SCOPED_PROFILING_EVENT_CL("ClAdditionWorkload_Execute");
telsoa01c577f2c2018-08-31 09:22:23 +010037 m_Layer.run();
38}
39
arovir01085f0a42018-10-08 14:48:19 +010040arm_compute::Status ClAdditionValidate(const TensorInfo& input0,
41 const TensorInfo& input1,
42 const TensorInfo& output)
telsoa01c577f2c2018-08-31 09:22:23 +010043{
telsoa01c577f2c2018-08-31 09:22:23 +010044 const arm_compute::TensorInfo aclInput0Info = BuildArmComputeTensorInfo(input0);
45 const arm_compute::TensorInfo aclInput1Info = BuildArmComputeTensorInfo(input1);
46 const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output);
47
48 const arm_compute::Status aclStatus = arm_compute::CLArithmeticAddition::validate(&aclInput0Info,
49 &aclInput1Info,
50 &aclOutputInfo,
51 g_AclConvertPolicy);
52
arovir01085f0a42018-10-08 14:48:19 +010053 return aclStatus;
telsoa01c577f2c2018-08-31 09:22:23 +010054}
55
56} //namespace armnn
57
David Beck0a710c42018-09-11 15:21:14 +010058template class armnn::ClAdditionWorkload<armnn::DataType::Float16, armnn::DataType::Float32>;
59template class armnn::ClAdditionWorkload<armnn::DataType::QuantisedAsymm8>;