ArmNN
 25.11
Loading...
Searching...
No Matches
NeonDetectionPostProcessWorkload.cpp
Go to the documentation of this file.
1//
2// Copyright © 2019-2023 Arm Ltd and Contributors. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
7
9
13
14namespace armnn
15{
16
17arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& descriptor)
18{
19 return arm_compute::DetectionPostProcessLayerInfo(descriptor.m_MaxDetections,
20 descriptor.m_MaxClassesPerDetection,
21 descriptor.m_NmsScoreThreshold,
22 descriptor.m_NmsIouThreshold,
23 descriptor.m_NumClasses,
24 { descriptor.m_ScaleX,
25 descriptor.m_ScaleY,
26 descriptor.m_ScaleW,
27 descriptor.m_ScaleH },
28 descriptor.m_UseRegularNms,
29 descriptor.m_DetectionsPerClass);
30}
31
32arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,
33 const TensorInfo& scores,
34 const TensorInfo& anchors,
35 const TensorInfo& detectionBoxes,
36 const TensorInfo& detectionClasses,
37 const TensorInfo& detectionScores,
38 const TensorInfo& numDetections,
39 const DetectionPostProcessDescriptor &descriptor)
40{
41 arm_compute::DetectionPostProcessLayerInfo info = MakeInfo(descriptor);
42
43 const arm_compute::TensorInfo aclBoxEncodings =
44 armcomputetensorutils::BuildArmComputeTensorInfo(boxEncodings);
45
46 const arm_compute::TensorInfo aclScores =
47 armcomputetensorutils::BuildArmComputeTensorInfo(scores);
48
49 const arm_compute::TensorInfo aclAnchors =
50 armcomputetensorutils::BuildArmComputeTensorInfo(anchors);
51
52 arm_compute::TensorInfo aclDetectionBoxes =
53 armcomputetensorutils::BuildArmComputeTensorInfo(detectionBoxes);
54
55 arm_compute::TensorInfo aclDetectionClasses =
56 armcomputetensorutils::BuildArmComputeTensorInfo(detectionClasses);
57
58 arm_compute::TensorInfo aclDetectionScores =
59 armcomputetensorutils::BuildArmComputeTensorInfo(detectionScores);
60
61 arm_compute::TensorInfo aclNumDetections =
62 armcomputetensorutils::BuildArmComputeTensorInfo(numDetections);
63
64 return arm_compute::NEDetectionPostProcessLayer::validate(
65 &aclBoxEncodings,
66 &aclScores,
67 &aclAnchors,
68 &aclDetectionBoxes,
69 &aclDetectionClasses,
70 &aclDetectionScores,
71 &aclNumDetections,
72 info);
73}
74
77 const WorkloadInfo& info)
79{
80 // Report Profiling Details
81 ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDetectionPostProcessWorkload_Construct",
82 descriptor.m_Parameters,
83 info,
84 this->GetGuid());
85
86 m_Anchors = std::make_unique<arm_compute::Tensor>();
87 BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());
88
89 arm_compute::DetectionPostProcessLayerInfo di = MakeInfo(m_Data.m_Parameters);
90
91 auto AclTensorRef = [](ITensorHandle* tensor) -> arm_compute::ITensor&
92 {
93 return PolymorphicDowncast<IAclTensorHandle*>(tensor)->GetTensor();
94 };
95
96 arm_compute::ITensor& boxEncodings = AclTensorRef(m_Data.m_Inputs[0]);
97 arm_compute::ITensor& scores = AclTensorRef(m_Data.m_Inputs[1]);
98
99 arm_compute::ITensor& detectionBoxes = AclTensorRef(m_Data.m_Outputs[0]);
100 arm_compute::ITensor& detectionClasses = AclTensorRef(m_Data.m_Outputs[1]);
101 arm_compute::ITensor& detectionScores = AclTensorRef(m_Data.m_Outputs[2]);
102 arm_compute::ITensor& numDetections = AclTensorRef(m_Data.m_Outputs[3]);
103
104 m_Func.configure(&boxEncodings, &scores, m_Anchors.get(),
105 &detectionBoxes, &detectionClasses, &detectionScores, &numDetections,
106 di);
107
108 InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);
109}
110
112{
113 ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonDetectionPostProcessWorkload_Execute");
114 m_Func.run();
115}
116
117} // namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
const TensorInfo & GetTensorInfo() const
NeonBaseWorkload(const DetectionPostProcessQueueDescriptor &descriptor, const WorkloadInfo &info)
NeonDetectionPostProcessWorkload(const DetectionPostProcessQueueDescriptor &descriptor, const WorkloadInfo &info)
virtual void Execute() const override
Copyright (c) 2021 ARM Limited and Contributors.
arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor &descriptor)
DestType PolymorphicDowncast(SourceType *value)
Polymorphic downcast for build in pointers only.
arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo &boxEncodings, const TensorInfo &scores, const TensorInfo &anchors, const TensorInfo &detectionBoxes, const TensorInfo &detectionClasses, const TensorInfo &detectionScores, const TensorInfo &numDetections, const DetectionPostProcessDescriptor &descriptor)
void InitializeArmComputeTensorData(arm_compute::Tensor &tensor, TensorInfo tensorInfo, const ITensorHandle *handle)
uint32_t m_NumClasses
Number of classes.
float m_NmsScoreThreshold
NMS score threshold.
float m_NmsIouThreshold
Intersection over union threshold.
uint32_t m_DetectionsPerClass
Detections per classes, used in Regular NMS.
bool m_UseRegularNms
Use Regular NMS.
uint32_t m_MaxClassesPerDetection
Maximum numbers of classes per detection, used in Fast NMS.
uint32_t m_MaxDetections
Maximum numbers of detections.
const ConstTensorHandle * m_Anchors
Contains information about TensorInfos of a layer.