plain/23.05/_neon_detection_post_process_workload_8cpp_source.xhtml

//

// Copyright © 2019 Arm Ltd and Contributors. All rights reserved.

// SPDX-License-Identifier: MIT

//


#include "NeonDetectionPostProcessWorkload.hpp"


#include "NeonWorkloadUtils.hpp"


#include <aclCommon/ArmComputeTensorHandle.hpp>

#include <aclCommon/ArmComputeTensorUtils.hpp>

#include <armnn/utility/PolymorphicDowncast.hpp>


namespace armnn

{


arm_compute::DetectionPostProcessLayerInfo MakeInfo(const DetectionPostProcessDescriptor& descriptor)

{

    return arm_compute::DetectionPostProcessLayerInfo(descriptor.m_MaxDetections,

                                                      descriptor.m_MaxClassesPerDetection,

                                                      descriptor.m_NmsScoreThreshold,

                                                      descriptor.m_NmsIouThreshold,

                                                      descriptor.m_NumClasses,

                                                      { descriptor.m_ScaleX,

                                                        descriptor.m_ScaleY,

                                                        descriptor.m_ScaleW,

                                                        descriptor.m_ScaleH },

                                                      descriptor.m_UseRegularNms,

                                                      descriptor.m_DetectionsPerClass);

}


arm_compute::Status NeonDetectionPostProcessValidate(const TensorInfo& boxEncodings,

                                                     const TensorInfo& scores,

                                                     const TensorInfo& anchors,

                                                     const TensorInfo& detectionBoxes,

                                                     const TensorInfo& detectionClasses,

                                                     const TensorInfo& detectionScores,

                                                     const TensorInfo& numDetections,

                                                     const DetectionPostProcessDescriptor &descriptor)

{

    arm_compute::DetectionPostProcessLayerInfo info = MakeInfo(descriptor);


    const arm_compute::TensorInfo aclBoxEncodings =

        armcomputetensorutils::BuildArmComputeTensorInfo(boxEncodings);


    const arm_compute::TensorInfo aclScores =

        armcomputetensorutils::BuildArmComputeTensorInfo(scores);


    const arm_compute::TensorInfo aclAnchors =

        armcomputetensorutils::BuildArmComputeTensorInfo(anchors);


    arm_compute::TensorInfo aclDetectionBoxes =

        armcomputetensorutils::BuildArmComputeTensorInfo(detectionBoxes);


    arm_compute::TensorInfo aclDetectionClasses =

        armcomputetensorutils::BuildArmComputeTensorInfo(detectionClasses);


    arm_compute::TensorInfo aclDetectionScores =

        armcomputetensorutils::BuildArmComputeTensorInfo(detectionScores);


    arm_compute::TensorInfo aclNumDetections =

        armcomputetensorutils::BuildArmComputeTensorInfo(numDetections);


    return arm_compute::NEDetectionPostProcessLayer::validate(

            &aclBoxEncodings,

            &aclScores,

            &aclAnchors,

            &aclDetectionBoxes,

            &aclDetectionClasses,

            &aclDetectionScores,

            &aclNumDetections,

            info);

}


NeonDetectionPostProcessWorkload::NeonDetectionPostProcessWorkload(

    const DetectionPostProcessQueueDescriptor& descriptor,

    const WorkloadInfo& info)

    : NeonBaseWorkload<DetectionPostProcessQueueDescriptor>(descriptor, info)

{

    // Report Profiling Details

    ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDetectionPostProcessWorkload_Construct",

                                         descriptor.m_Parameters,

                                         info,

                                         this->GetGuid());


    m_Anchors = std::make_unique<arm_compute::Tensor>();

    BuildArmComputeTensor(*m_Anchors, descriptor.m_Anchors->GetTensorInfo());


    arm_compute::DetectionPostProcessLayerInfo di = MakeInfo(m_Data.m_Parameters);


    auto AclTensorRef = [](ITensorHandle* tensor) -> arm_compute::ITensor&

        {

            return PolymorphicDowncast<IAclTensorHandle*>(tensor)->GetTensor();

        };


    arm_compute::ITensor& boxEncodings  = AclTensorRef(m_Data.m_Inputs[0]);

    arm_compute::ITensor& scores        = AclTensorRef(m_Data.m_Inputs[1]);


    arm_compute::ITensor& detectionBoxes    = AclTensorRef(m_Data.m_Outputs[0]);

    arm_compute::ITensor& detectionClasses  = AclTensorRef(m_Data.m_Outputs[1]);

    arm_compute::ITensor& detectionScores   = AclTensorRef(m_Data.m_Outputs[2]);

    arm_compute::ITensor& numDetections     = AclTensorRef(m_Data.m_Outputs[3]);


    m_Func.configure(&boxEncodings, &scores, m_Anchors.get(),

                     &detectionBoxes, &detectionClasses, &detectionScores, &numDetections,

                     di);


    InitializeArmComputeTensorData(*m_Anchors, m_Data.m_Anchors);

}


void NeonDetectionPostProcessWorkload::Execute() const

{

    ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonDetectionPostProcessWorkload_Execute", this->GetGuid());

    m_Func.run();

}


} // namespace armnn