blob: 36f1cd98de8445130c554f8efc5668850cd681c1 [file] [log] [blame]
Derek Lamberti6a5e5e82019-12-05 14:41:20 +00001//
2// Copyright © 2019 Arm Ltd. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
6#include "NeonDetectionPostProcessWorkload.hpp"
7
8#include "NeonWorkloadUtils.hpp"
9
10#include <aclCommon/ArmComputeTensorHandle.hpp>
11#include <aclCommon/ArmComputeTensorUtils.hpp>
Jan Eilersbb446e52020-04-02 13:56:54 +010012#include <armnn/utility/PolymorphicDowncast.hpp>
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000013
14namespace armnn
15{
16
17arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& desc)
18{
19 return arm_compute::DetectionPostProcessLayerInfo(desc.m_MaxDetections,
20 desc.m_MaxClassesPerDetection,
21 desc.m_NmsScoreThreshold,
22 desc.m_NmsIouThreshold,
23 desc.m_NumClasses,
24 { desc.m_ScaleX,
25 desc.m_ScaleY,
26 desc.m_ScaleW,
27 desc.m_ScaleH },
28 desc.m_UseRegularNms,
29 desc.m_DetectionsPerClass);
30}
31
32arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,
33 const TensorInfo& scores,
34 const TensorInfo& anchors,
35 const TensorInfo& detectionBoxes,
36 const TensorInfo& detectionClasses,
37 const TensorInfo& detectionScores,
38 const TensorInfo& numDetections,
39 const DetectionPostProcessDescriptor &desc)
40{
41 arm_compute::DetectionPostProcessLayerInfo info = MakeInfo(desc);
42
43 const arm_compute::TensorInfo aclBoxEncodings =
44 armcomputetensorutils::BuildArmComputeTensorInfo(boxEncodings);
45
46 const arm_compute::TensorInfo aclScores =
47 armcomputetensorutils::BuildArmComputeTensorInfo(scores);
48
49 const arm_compute::TensorInfo aclAnchors =
50 armcomputetensorutils::BuildArmComputeTensorInfo(anchors);
51
52 arm_compute::TensorInfo aclDetectionBoxes =
53 armcomputetensorutils::BuildArmComputeTensorInfo(detectionBoxes);
54
55 arm_compute::TensorInfo aclDetectionClasses =
56 armcomputetensorutils::BuildArmComputeTensorInfo(detectionClasses);
57
58 arm_compute::TensorInfo aclDetectionScores =
59 armcomputetensorutils::BuildArmComputeTensorInfo(detectionScores);
60
61 arm_compute::TensorInfo aclNumDetections =
62 armcomputetensorutils::BuildArmComputeTensorInfo(numDetections);
63
James Conroy99bf80d2020-02-20 11:14:49 +000064 return arm_compute::NEDetectionPostProcessLayer::validate(
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000065 &aclBoxEncodings,
66 &aclScores,
67 &aclAnchors,
68 &aclDetectionBoxes,
69 &aclDetectionClasses,
70 &aclDetectionScores,
71 &aclNumDetections,
72 info);
73}
74
75NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload(
76 const DetectionPostProcessQueueDescriptor& descriptor,
77 const WorkloadInfo& info)
78 : BaseWorkload<DetectionPostProcessQueueDescriptor>(descriptor, info)
79{
80 m_Anchors = std::make_unique<arm_compute::Tensor>();
81 BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());
82
83 arm_compute::DetectionPostProcessLayerInfo di = MakeInfo(m_Data.m_Parameters);
84
85 auto AclTensorRef = [](ITensorHandle* tensor) -> arm_compute::ITensor&
86 {
Jan Eilersbb446e52020-04-02 13:56:54 +010087 return PolymorphicDowncast<IAclTensorHandle*>(tensor)->GetTensor();
Derek Lamberti6a5e5e82019-12-05 14:41:20 +000088 };
89
90 arm_compute::ITensor& boxEncodings = AclTensorRef(m_Data.m_Inputs[0]);
91 arm_compute::ITensor& scores = AclTensorRef(m_Data.m_Inputs[1]);
92
93 arm_compute::ITensor& detectionBoxes = AclTensorRef(m_Data.m_Outputs[0]);
94 arm_compute::ITensor& detectionClasses = AclTensorRef(m_Data.m_Outputs[1]);
95 arm_compute::ITensor& detectionScores = AclTensorRef(m_Data.m_Outputs[2]);
96 arm_compute::ITensor& numDetections = AclTensorRef(m_Data.m_Outputs[3]);
97
98 m_Func.configure(&boxEncodings, &scores, m_Anchors.get(),
99 &detectionBoxes, &detectionClasses, &detectionScores, &numDetections,
100 di);
101
102 InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);
103}
104
105void NeonDetectionPostProcessWorkload::Execute() const
106{
107 ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonDetectionPostProcessWorkload_Execute");
108 m_Func.run();
109}
110
111} // namespace armnn