diff options
Diffstat (limited to 'src/backends/neon/workloads/NeonRsqrtWorkload.cpp')
-rw-r--r-- | src/backends/neon/workloads/NeonRsqrtWorkload.cpp | 43 |
1 files changed, 43 insertions, 0 deletions
diff --git a/src/backends/neon/workloads/NeonRsqrtWorkload.cpp b/src/backends/neon/workloads/NeonRsqrtWorkload.cpp new file mode 100644 index 0000000000..b6292833dd --- /dev/null +++ b/src/backends/neon/workloads/NeonRsqrtWorkload.cpp @@ -0,0 +1,43 @@ +// +// Copyright © 2019 Arm Ltd. All rights reserved. +// SPDX-License-Identifier: MIT +// + +#include "NeonRsqrtWorkload.hpp" + +#include "NeonWorkloadUtils.hpp" + +#include <aclCommon/ArmComputeTensorHandle.hpp> +#include <aclCommon/ArmComputeTensorUtils.hpp> + +#include <boost/cast.hpp> + +namespace armnn +{ + +arm_compute::Status NeonRsqrtWorkloadValidate(const TensorInfo& input, const TensorInfo& output) +{ + const arm_compute::TensorInfo aclInput = armcomputetensorutils::BuildArmComputeTensorInfo(input); + const arm_compute::TensorInfo aclOutput = armcomputetensorutils::BuildArmComputeTensorInfo(output); + + return arm_compute::NERsqrtLayer::validate(&aclInput, &aclOutput); +} + +NeonRsqrtWorkload::NeonRsqrtWorkload(const RsqrtQueueDescriptor& descriptor, const WorkloadInfo& info) + : BaseWorkload<RsqrtQueueDescriptor>(descriptor, info) +{ + m_Data.ValidateInputsOutputs("NeonRsqrtWorkload", 1, 1); + + arm_compute::ITensor& input = boost::polymorphic_downcast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor(); + arm_compute::ITensor& output = boost::polymorphic_downcast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor(); + + m_RsqrtLayer.configure(&input, &output); +} + +void NeonRsqrtWorkload::Execute() const +{ + ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonRsqrtWorkload_Execute"); + m_RsqrtLayer.run(); +} + +} // namespace armnn |