blob: df6c39a10b30d8cb62f638318f202db6a08c10c2 [file] [log] [blame]
//
// Copyright © 2019-2023 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#include "NeonRsqrtWorkload.hpp"
7
8#include "NeonWorkloadUtils.hpp"
9
10#include <aclCommon/ArmComputeTensorHandle.hpp>
11#include <aclCommon/ArmComputeTensorUtils.hpp>
Jan Eilersbb446e52020-04-02 13:56:54 +010012#include <armnn/utility/PolymorphicDowncast.hpp>
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010013
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010014
15namespace armnn
16{
17
18arm_compute::Status NeonRsqrtWorkloadValidate(const TensorInfo& input, const TensorInfo& output)
19{
20 const arm_compute::TensorInfo aclInput = armcomputetensorutils::BuildArmComputeTensorInfo(input);
21 const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output);
22
23 return arm_compute::NERsqrtLayer::validate(&aclInput, &aclOutput);
24}
25
26NeonRsqrtWorkload::NeonRsqrtWorkload(const RsqrtQueueDescriptor& descriptor, const WorkloadInfo& info)
Teresa Charlin588cbdf2022-01-19 15:55:37 +000027 : NeonBaseWorkload<RsqrtQueueDescriptor>(descriptor, info)
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010028{
29 m_Data.ValidateInputsOutputs("NeonRsqrtWorkload", 1, 1);
30
Jan Eilersbb446e52020-04-02 13:56:54 +010031 arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
32 arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010033
34 m_RsqrtLayer.configure(&input, &output);
35}
36
37void NeonRsqrtWorkload::Execute() const
38{
Mike Kelly7cbe7812023-07-25 17:37:33 +010039 ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonRsqrtWorkload_Execute");
Aron Virginas-Tar0dd3b432019-09-10 13:55:09 +010040 m_RsqrtLayer.run();
41}
42
43} // namespace armnn