xref: /aosp_15_r20/external/armnn/src/backends/neon/workloads/NeonDetectionPostProcessWorkload.cpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1 //
2 // Copyright © 2019 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NeonDetectionPostProcessWorkload.hpp"
7 
8 #include "NeonWorkloadUtils.hpp"
9 
10 #include <aclCommon/ArmComputeTensorHandle.hpp>
11 #include <aclCommon/ArmComputeTensorUtils.hpp>
12 #include <armnn/utility/PolymorphicDowncast.hpp>
13 
14 namespace armnn
15 {
16 
MakeInfo(const DetectionPostProcessDescriptor & descriptor)17 arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& descriptor)
18 {
19     return arm_compute::DetectionPostProcessLayerInfo(descriptor.m_MaxDetections,
20                                                       descriptor.m_MaxClassesPerDetection,
21                                                       descriptor.m_NmsScoreThreshold,
22                                                       descriptor.m_NmsIouThreshold,
23                                                       descriptor.m_NumClasses,
24                                                       { descriptor.m_ScaleX,
25                                                         descriptor.m_ScaleY,
26                                                         descriptor.m_ScaleW,
27                                                         descriptor.m_ScaleH },
28                                                       descriptor.m_UseRegularNms,
29                                                       descriptor.m_DetectionsPerClass);
30 }
31 
NeonDetectionPostProcessValidate(const TensorInfo & boxEncodings,const TensorInfo & scores,const TensorInfo & anchors,const TensorInfo & detectionBoxes,const TensorInfo & detectionClasses,const TensorInfo & detectionScores,const TensorInfo & numDetections,const DetectionPostProcessDescriptor & descriptor)32 arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,
33                                                      const TensorInfo& scores,
34                                                      const TensorInfo& anchors,
35                                                      const TensorInfo& detectionBoxes,
36                                                      const TensorInfo& detectionClasses,
37                                                      const TensorInfo& detectionScores,
38                                                      const TensorInfo& numDetections,
39                                                      const DetectionPostProcessDescriptor &descriptor)
40 {
41     arm_compute::DetectionPostProcessLayerInfo info = MakeInfo(descriptor);
42 
43     const arm_compute::TensorInfo aclBoxEncodings =
44         armcomputetensorutils::BuildArmComputeTensorInfo(boxEncodings);
45 
46     const arm_compute::TensorInfo aclScores =
47         armcomputetensorutils::BuildArmComputeTensorInfo(scores);
48 
49     const arm_compute::TensorInfo aclAnchors =
50         armcomputetensorutils::BuildArmComputeTensorInfo(anchors);
51 
52     arm_compute::TensorInfo aclDetectionBoxes =
53         armcomputetensorutils::BuildArmComputeTensorInfo(detectionBoxes);
54 
55     arm_compute::TensorInfo aclDetectionClasses =
56         armcomputetensorutils::BuildArmComputeTensorInfo(detectionClasses);
57 
58     arm_compute::TensorInfo aclDetectionScores =
59         armcomputetensorutils::BuildArmComputeTensorInfo(detectionScores);
60 
61     arm_compute::TensorInfo aclNumDetections =
62         armcomputetensorutils::BuildArmComputeTensorInfo(numDetections);
63 
64     return arm_compute::NEDetectionPostProcessLayer::validate(
65             &aclBoxEncodings,
66             &aclScores,
67             &aclAnchors,
68             &aclDetectionBoxes,
69             &aclDetectionClasses,
70             &aclDetectionScores,
71             &aclNumDetections,
72             info);
73 }
74 
NeonDetectionPostProcessWorkload(const DetectionPostProcessQueueDescriptor & descriptor,const WorkloadInfo & info)75 NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload(
76     const DetectionPostProcessQueueDescriptor& descriptor,
77     const WorkloadInfo& info)
78     : NeonBaseWorkload<DetectionPostProcessQueueDescriptor>(descriptor, info)
79 {
80     // Report Profiling Details
81     ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDetectionPostProcessWorkload_Construct",
82                                          descriptor.m_Parameters,
83                                          info,
84                                          this->GetGuid());
85 
86     m_Anchors = std::make_unique<arm_compute::Tensor>();
87     BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());
88 
89     arm_compute::DetectionPostProcessLayerInfo di = MakeInfo(m_Data.m_Parameters);
90 
91     auto AclTensorRef = [](ITensorHandle* tensor) -> arm_compute::ITensor&
92         {
93             return PolymorphicDowncast<IAclTensorHandle*>(tensor)->GetTensor();
94         };
95 
96     arm_compute::ITensor& boxEncodings  = AclTensorRef(m_Data.m_Inputs[0]);
97     arm_compute::ITensor& scores        = AclTensorRef(m_Data.m_Inputs[1]);
98 
99     arm_compute::ITensor& detectionBoxes    = AclTensorRef(m_Data.m_Outputs[0]);
100     arm_compute::ITensor& detectionClasses  = AclTensorRef(m_Data.m_Outputs[1]);
101     arm_compute::ITensor& detectionScores   = AclTensorRef(m_Data.m_Outputs[2]);
102     arm_compute::ITensor& numDetections     = AclTensorRef(m_Data.m_Outputs[3]);
103 
104     m_Func.configure(&boxEncodings, &scores, m_Anchors.get(),
105                      &detectionBoxes, &detectionClasses, &detectionScores, &numDetections,
106                      di);
107 
108     InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);
109 }
110 
Execute() const111 void NeonDetectionPostProcessWorkload::Execute() const
112 {
113     ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonDetectionPostProcessWorkload_Execute", this->GetGuid());
114     m_Func.run();
115 }
116 
117 } // namespace armnn
118