aboutsummaryrefslogtreecommitdiff
path: root/src/backends/neon/workloads/NeonRsqrtWorkload.cpp
diff options
context:
space:
mode:
authorAron Virginas-Tar <Aron.Virginas-Tar@arm.com>2019-09-10 13:55:09 +0100
committerÁron Virginás-Tar <aron.virginas-tar@arm.com>2019-09-10 13:56:46 +0000
commit0dd3b43e1497ab406acfdefca425143fbefb1ee4 (patch)
tree9306c9f62402329306c171ca6d4d5107e43c2a2e /src/backends/neon/workloads/NeonRsqrtWorkload.cpp
parent4ffcc8fb1d4c893e62a8c1fb330fe2742cff5407 (diff)
downloadarmnn-0dd3b43e1497ab406acfdefca425143fbefb1ee4.tar.gz
IVGCVSW-3830 Add NEON workload for RSQRT
Signed-off-by: Aron Virginas-Tar <Aron.Virginas-Tar@arm.com> Change-Id: Ida590b7d28dbee40e496794c42b682d740427cca
Diffstat (limited to 'src/backends/neon/workloads/NeonRsqrtWorkload.cpp')
-rw-r--r--src/backends/neon/workloads/NeonRsqrtWorkload.cpp43
1 files changed, 43 insertions, 0 deletions
diff --git a/src/backends/neon/workloads/NeonRsqrtWorkload.cpp b/src/backends/neon/workloads/NeonRsqrtWorkload.cpp
new file mode 100644
index 0000000000..b6292833dd
--- /dev/null
+++ b/src/backends/neon/workloads/NeonRsqrtWorkload.cpp
@@ -0,0 +1,43 @@
+//
+// Copyright © 2019 Arm Ltd. All rights reserved.
+// SPDX-License-Identifier: MIT
+//
+
+#include "NeonRsqrtWorkload.hpp"
+
+#include "NeonWorkloadUtils.hpp"
+
+#include <aclCommon/ArmComputeTensorHandle.hpp>
+#include <aclCommon/ArmComputeTensorUtils.hpp>
+
+#include <boost/cast.hpp>
+
+namespace armnn
+{
+
+// Asks the Arm Compute Library whether its NEON RSQRT layer supports the given tensors.
+//
+// Both Arm NN tensor descriptions are converted with BuildArmComputeTensorInfo and the
+// resulting ACL descriptions are passed to arm_compute::NERsqrtLayer::validate.
+//
+// input  - description of the tensor the layer would read
+// output - description of the tensor the layer would write
+//
+// Returns the status reported by NERsqrtLayer::validate, unchanged.
+arm_compute::Status NeonRsqrtWorkloadValidate(const TensorInfo& input, const TensorInfo& output)
+{
+    using armcomputetensorutils::BuildArmComputeTensorInfo;
+
+    // The ACL descriptions only need to live for the duration of the validate call.
+    const arm_compute::TensorInfo aclSrcInfo = BuildArmComputeTensorInfo(input);
+    const arm_compute::TensorInfo aclDstInfo = BuildArmComputeTensorInfo(output);
+
+    return arm_compute::NERsqrtLayer::validate(&aclSrcInfo, &aclDstInfo);
+}
+
+// Constructs the workload and configures the RSQRT layer.
+//
+// The descriptor and workload info are forwarded to BaseWorkload. The stored descriptor is
+// then validated via ValidateInputsOutputs (called with the counts 1 and 1), and the layer
+// is configured on the tensors behind the first input and first output handles.
+NeonRsqrtWorkload::NeonRsqrtWorkload(const RsqrtQueueDescriptor& descriptor, const WorkloadInfo& info)
+    : BaseWorkload<RsqrtQueueDescriptor>(descriptor, info)
+{
+    m_Data.ValidateInputsOutputs("NeonRsqrtWorkload", 1, 1);
+
+    // Downcast each generic handle to the ACL handle interface to reach its tensor.
+    auto* const srcHandle = boost::polymorphic_downcast<IAclTensorHandle*>(m_Data.m_Inputs[0]);
+    arm_compute::ITensor& srcTensor = srcHandle->GetTensor();
+
+    auto* const dstHandle = boost::polymorphic_downcast<IAclTensorHandle*>(m_Data.m_Outputs[0]);
+    arm_compute::ITensor& dstTensor = dstHandle->GetTensor();
+
+    m_RsqrtLayer.configure(&srcTensor, &dstTensor);
+}
+
+void NeonRsqrtWorkload::Execute() const // Runs the RSQRT layer that the constructor configured.
+{
+ ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonRsqrtWorkload_Execute"); // profiling event labelled with the workload name; presumably covers the rest of this scope (macro body not visible here)
+ m_RsqrtLayer.run(); // NOTE(review): called from a const method, so m_RsqrtLayer is presumably declared mutable in the header - confirm
+}
+
+} // namespace armnn