patch/latest/_neon_detection_post_process_workload_8cpp_source.html

 //

+ // Copyright © 2019-2023 Arm Ltd and Contributors. All rights reserved.

+ // SPDX-License-Identifier: MIT

+ //

+

+ #include "NeonDetectionPostProcessWorkload.hpp"

+

+ #include "NeonWorkloadUtils.hpp"

+

+ #include <aclCommon/ArmComputeTensorHandle.hpp>

+ #include <aclCommon/ArmComputeTensorUtils.hpp>

+ #include <armnn/utility/PolymorphicDowncast.hpp>

+

+ namespace armnn

+ {

+

+ arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& descriptor)

+ {

+     return arm_compute::DetectionPostProcessLayerInfo(descriptor.m_MaxDetections,

+                                                       descriptor.m_MaxClassesPerDetection,

+                                                       descriptor.m_NmsScoreThreshold,

+                                                       descriptor.m_NmsIouThreshold,

+                                                       descriptor.m_NumClasses,

+                                                       { descriptor.m_ScaleX,

+                                                         descriptor.m_ScaleY,

+                                                         descriptor.m_ScaleW,

+                                                         descriptor.m_ScaleH },

+                                                       descriptor.m_UseRegularNms,

+                                                       descriptor.m_DetectionsPerClass);

+ }

+

+ arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,

+                                                      const TensorInfo& scores,

+                                                      const TensorInfo& anchors,

+                                                      const TensorInfo& detectionBoxes,

+                                                      const TensorInfo& detectionClasses,

+                                                      const TensorInfo& detectionScores,

+                                                      const TensorInfo& numDetections,

+                                                      const DetectionPostProcessDescriptor &descriptor)

+ {

+     arm_compute::DetectionPostProcessLayerInfo info = MakeInfo(descriptor);

+

+     const arm_compute::TensorInfo aclBoxEncodings =

+         armcomputetensorutils::BuildArmComputeTensorInfo(boxEncodings);

+

+     const arm_compute::TensorInfo aclScores =

+         armcomputetensorutils::BuildArmComputeTensorInfo(scores);

+

+     const arm_compute::TensorInfo aclAnchors =

+         armcomputetensorutils::BuildArmComputeTensorInfo(anchors);

+

+     arm_compute::TensorInfo aclDetectionBoxes =

+         armcomputetensorutils::BuildArmComputeTensorInfo(detectionBoxes);

+

+     arm_compute::TensorInfo aclDetectionClasses =

+         armcomputetensorutils::BuildArmComputeTensorInfo(detectionClasses);

+

+     arm_compute::TensorInfo aclDetectionScores =

+         armcomputetensorutils::BuildArmComputeTensorInfo(detectionScores);

+

+     arm_compute::TensorInfo aclNumDetections =

+         armcomputetensorutils::BuildArmComputeTensorInfo(numDetections);

+

+     return arm_compute::NEDetectionPostProcessLayer::validate(

+             &aclBoxEncodings,

+             &aclScores,

+             &aclAnchors,

+             &aclDetectionBoxes,

+             &aclDetectionClasses,

+             &aclDetectionScores,

+             &aclNumDetections,

+             info);

+ }

+

+ NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload(

+     const DetectionPostProcessQueueDescriptor& descriptor,

+     const WorkloadInfo& info)

+     : NeonBaseWorkload<DetectionPostProcessQueueDescriptor>(descriptor, info)

+ {

+     // Report Profiling Details

+     ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDetectionPostProcessWorkload_Construct",

+                                          descriptor.m_Parameters,

+                                          info,

+                                          this->GetGuid());

+

+     m_Anchors = std::make_unique<arm_compute::Tensor>();

+     BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());

+

+     arm_compute::DetectionPostProcessLayerInfo di = MakeInfo(m_Data.m_Parameters);

+

+     auto AclTensorRef = [](ITensorHandle* tensor) -> arm_compute::ITensor&

+         {

+             return PolymorphicDowncast<IAclTensorHandle*>(tensor)->GetTensor();

+         };

+

+     arm_compute::ITensor& boxEncodings  = AclTensorRef(m_Data.m_Inputs[0]);

+     arm_compute::ITensor& scores        = AclTensorRef(m_Data.m_Inputs[1]);

+

+     arm_compute::ITensor& detectionBoxes    = AclTensorRef(m_Data.m_Outputs[0]);

+     arm_compute::ITensor& detectionClasses  = AclTensorRef(m_Data.m_Outputs[1]);

+     arm_compute::ITensor& detectionScores   = AclTensorRef(m_Data.m_Outputs[2]);

+     arm_compute::ITensor& numDetections     = AclTensorRef(m_Data.m_Outputs[3]);

+

+     m_Func.configure(&boxEncodings, &scores, m_Anchors.get(),

+                      &detectionBoxes, &detectionClasses, &detectionScores, &numDetections,

+                      di);

+

+     InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);

+ }

+

+ void NeonDetectionPostProcessWorkload::Execute() const

+ {

+     ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonDetectionPostProcessWorkload_Execute");

+     m_Func.run();

+ }

+

+ } // namespace armnn

+