plain/21.02/_neon_detection_post_process_workload_8cpp_source.xhtml

 //
 // Copyright © 2019 Arm Ltd. All rights reserved.
 // SPDX-License-Identifier: MIT
 //

 #include "NeonDetectionPostProcessWorkload.hpp"

 #include "NeonWorkloadUtils.hpp"

 #include <aclCommon/ArmComputeTensorHandle.hpp>
 #include <aclCommon/ArmComputeTensorUtils.hpp>
 #include <armnn/utility/PolymorphicDowncast.hpp>

 namespace armnn
 {

 /// Translates an ArmNN DetectionPostProcessDescriptor into the corresponding
 /// arm_compute::DetectionPostProcessLayerInfo.
 ///
 /// The four scale factors are forwarded as a single brace-enclosed group in the
 /// order X, Y, W, H; every other field is passed through one-to-one.
 ///
 /// @param desc  ArmNN descriptor holding the detection post-process parameters.
 /// @return      Layer info constructed from the fields of @p desc.
 arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& desc)
 {
     arm_compute::DetectionPostProcessLayerInfo layerInfo(
         desc.m_MaxDetections,
         desc.m_MaxClassesPerDetection,
         desc.m_NmsScoreThreshold,
         desc.m_NmsIouThreshold,
         desc.m_NumClasses,
         { desc.m_ScaleX, desc.m_ScaleY, desc.m_ScaleW, desc.m_ScaleH },
         desc.m_UseRegularNms,
         desc.m_DetectionsPerClass);

     return layerInfo;
 }

 /// Asks arm_compute::NEDetectionPostProcessLayer whether it accepts the given
 /// tensor configuration and descriptor.
 ///
 /// Each ArmNN TensorInfo is converted with BuildArmComputeTensorInfo and the
 /// descriptor is converted with MakeInfo before being handed to
 /// NEDetectionPostProcessLayer::validate.
 ///
 /// @param boxEncodings      Input: box encodings tensor info.
 /// @param scores            Input: scores tensor info.
 /// @param anchors           Input: anchors tensor info.
 /// @param detectionBoxes    Output: detection boxes tensor info.
 /// @param detectionClasses  Output: detection classes tensor info.
 /// @param detectionScores   Output: detection scores tensor info.
 /// @param numDetections     Output: number-of-detections tensor info.
 /// @param desc              Detection post-process parameters.
 /// @return                  The status returned by NEDetectionPostProcessLayer::validate.
 arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,
                                                      const TensorInfo& scores,
                                                      const TensorInfo& anchors,
                                                      const TensorInfo& detectionBoxes,
                                                      const TensorInfo& detectionClasses,
                                                      const TensorInfo& detectionScores,
                                                      const TensorInfo& numDetections,
                                                      const DetectionPostProcessDescriptor &desc)
 {
     using armcomputetensorutils::BuildArmComputeTensorInfo;

     // Inputs are only read by validate(), so their infos can be const.
     const arm_compute::TensorInfo inBoxEncodingsInfo = BuildArmComputeTensorInfo(boxEncodings);
     const arm_compute::TensorInfo inScoresInfo       = BuildArmComputeTensorInfo(scores);
     const arm_compute::TensorInfo inAnchorsInfo      = BuildArmComputeTensorInfo(anchors);

     // Outputs are passed as pointers to non-const infos, exactly as before.
     arm_compute::TensorInfo outBoxesInfo         = BuildArmComputeTensorInfo(detectionBoxes);
     arm_compute::TensorInfo outClassesInfo       = BuildArmComputeTensorInfo(detectionClasses);
     arm_compute::TensorInfo outScoresInfo        = BuildArmComputeTensorInfo(detectionScores);
     arm_compute::TensorInfo outNumDetectionsInfo = BuildArmComputeTensorInfo(numDetections);

     const arm_compute::DetectionPostProcessLayerInfo layerInfo = MakeInfo(desc);

     return arm_compute::NEDetectionPostProcessLayer::validate(&inBoxEncodingsInfo,
                                                               &inScoresInfo,
                                                               &inAnchorsInfo,
                                                               &outBoxesInfo,
                                                               &outClassesInfo,
                                                               &outScoresInfo,
                                                               &outNumDetectionsInfo,
                                                               layerInfo);
 }

 /// Constructs the workload: creates the anchors tensor, configures the
 /// underlying Neon function with the workload's inputs/outputs, and finally
 /// initialises the anchors tensor from the descriptor's anchor handle.
 ///
 /// @param descriptor  Queue descriptor providing inputs, outputs, anchors and parameters.
 /// @param info        Workload info forwarded to BaseWorkload.
 NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload(
     const DetectionPostProcessQueueDescriptor& descriptor,
     const WorkloadInfo& info)
     : BaseWorkload<DetectionPostProcessQueueDescriptor>(descriptor, info)
 {
     // Create the anchors tensor and give it the tensor info of the descriptor's anchors.
     m_Anchors = std::make_unique<arm_compute::Tensor>();
     BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());

     // Resolves an ArmNN tensor handle to the address of the ACL tensor it wraps.
     const auto toAclTensor = [](ITensorHandle* handle) -> arm_compute::ITensor*
         {
             return &PolymorphicDowncast<IAclTensorHandle*>(handle)->GetTensor();
         };

     // Two inputs: box encodings and scores.
     arm_compute::ITensor* const inBoxEncodings = toAclTensor(m_Data.m_Inputs[0]);
     arm_compute::ITensor* const inScores       = toAclTensor(m_Data.m_Inputs[1]);

     // Four outputs: boxes, classes, scores and the number of detections.
     arm_compute::ITensor* const outBoxes         = toAclTensor(m_Data.m_Outputs[0]);
     arm_compute::ITensor* const outClasses       = toAclTensor(m_Data.m_Outputs[1]);
     arm_compute::ITensor* const outScores        = toAclTensor(m_Data.m_Outputs[2]);
     arm_compute::ITensor* const outNumDetections = toAclTensor(m_Data.m_Outputs[3]);

     m_Func.configure(inBoxEncodings, inScores, m_Anchors.get(),
                      outBoxes, outClasses, outScores, outNumDetections,
                      MakeInfo(m_Data.m_Parameters));

     // The anchors data is initialised only after configure(), matching the original ordering.
     InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);
 }

 /// Executes the workload by running the Neon detection post-process function
 /// that was configured in the constructor.
 void NeonDetectionPostProcessWorkload::Execute() const
 {
     // Declared before run() so the profiling event is already open when the function executes.
     ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonDetectionPostProcessWorkload_Execute");
     m_Func.run();
 }

 } // namespace armnn
NeonDetectionPostProcessWorkload.hpp

armnn::DetectionPostProcessQueueDescriptor
Definition: WorkloadData.hpp:221

armnn::TensorInfo
Definition: Tensor.hpp:152

armnn::BaseWorkload< DetectionPostProcessQueueDescriptor >::m_Data
const DetectionPostProcessQueueDescriptor m_Data
Definition: Workload.hpp:46

ARMNN_SCOPED_PROFILING_EVENT_NEON
#define ARMNN_SCOPED_PROFILING_EVENT_NEON(name)
Definition: NeonWorkloadUtils.hpp:17

armnn::DetectionPostProcessDescriptor::m_DetectionsPerClass
uint32_t m_DetectionsPerClass
Detections per class, used in Regular NMS.
Definition: Descriptors.hpp:547

ArmComputeTensorUtils.hpp

boxEncodings
std::vector< float > boxEncodings({ 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, 1.0f, 0.0f, 0.0f, 0.0f, -1.0f, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, 1.0f, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f })

armnn
Copyright (c) 2021 ARM Limited and Contributors.
Definition: 01_00_software_tools.dox:6

armnn::QueueDescriptorWithParameters::m_Parameters
LayerDescriptor m_Parameters
Definition: WorkloadData.hpp:57

armnn::DetectionPostProcessDescriptor::m_MaxClassesPerDetection
uint32_t m_MaxClassesPerDetection
Maximum number of classes per detection, used in Fast NMS.
Definition: Descriptors.hpp:545

PolymorphicDowncast.hpp

armnn::DetectionPostProcessDescriptor::m_MaxDetections
uint32_t m_MaxDetections
Maximum number of detections.
Definition: Descriptors.hpp:543

armnn::NeonDetectionPostProcessValidate
arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo &boxEncodings, const TensorInfo &scores, const TensorInfo &anchors, const TensorInfo &detectionBoxes, const TensorInfo &detectionClasses, const TensorInfo &detectionScores, const TensorInfo &numDetections, const DetectionPostProcessDescriptor &desc)
Definition: NeonDetectionPostProcessWorkload.cpp:32

armnn::BaseWorkload
Definition: Workload.hpp:28

armnn::DetectionPostProcessDescriptor::m_NmsIouThreshold
float m_NmsIouThreshold
Intersection over union threshold.
Definition: Descriptors.hpp:551

armnn::ITensorHandle
Definition: ITensorHandle.hpp:15

armnn::NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload
NeonDetectionPostProcessWorkload(const DetectionPostProcessQueueDescriptor &descriptor, const WorkloadInfo &info)
Definition: NeonDetectionPostProcessWorkload.cpp:75

armnn::Status
Status
enumeration
Definition: Types.hpp:26

armnn::DetectionPostProcessDescriptor::m_NumClasses
uint32_t m_NumClasses
Number of classes.
Definition: Descriptors.hpp:553

NeonWorkloadUtils.hpp

armnn::DetectionPostProcessQueueDescriptor::m_Anchors
const ConstCpuTensorHandle * m_Anchors
Definition: WorkloadData.hpp:228

armnn::DetectionPostProcessDescriptor::m_UseRegularNms
bool m_UseRegularNms
Use Regular NMS.
Definition: Descriptors.hpp:555

armnn::InitializeArmComputeTensorData
void InitializeArmComputeTensorData(arm_compute::Tensor &tensor, const ConstCpuTensorHandle *handle)
Definition: NeonWorkloadUtils.hpp:35

scores
std::vector< float > scores({ 0.0f, 0.9f, 0.8f, 0.0f, 0.75f, 0.72f, 0.0f, 0.6f, 0.5f, 0.0f, 0.93f, 0.95f, 0.0f, 0.5f, 0.4f, 0.0f, 0.3f, 0.2f })

armnn::QueueDescriptor::m_Outputs
std::vector< ITensorHandle * > m_Outputs
Definition: WorkloadData.hpp:31

armnn::BoostLogSeverityMapping::info

ArmComputeTensorHandle.hpp

armnn::WorkloadInfo
Contains information about inputs and outputs to a layer.
Definition: WorkloadInfo.hpp:16

armnn::DetectionPostProcessDescriptor::m_NmsScoreThreshold
float m_NmsScoreThreshold
NMS score threshold.
Definition: Descriptors.hpp:549

armnn::QueueDescriptor::m_Inputs
std::vector< ITensorHandle * > m_Inputs
Definition: WorkloadData.hpp:30

armnn::MakeInfo
arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor &desc)
Definition: NeonDetectionPostProcessWorkload.cpp:17

armnn::DetectionPostProcessDescriptor
Definition: Descriptors.hpp:511

armnn::NeonDetectionPostProcessWorkload::Execute
virtual void Execute() const override
Definition: NeonDetectionPostProcessWorkload.cpp:105

armnn::ConstCpuTensorHandle::GetTensorInfo
const TensorInfo & GetTensorInfo() const
Definition: CpuTensorHandle.hpp:37

anchors
std::vector< float > anchors({ 0.5f, 0.5f, 1.0f, 1.0f, 0.5f, 0.5f, 1.0f, 1.0f, 0.5f, 0.5f, 1.0f, 1.0f, 0.5f, 10.5f, 1.0f, 1.0f, 0.5f, 10.5f, 1.0f, 1.0f, 0.5f, 100.5f, 1.0f, 1.0f })