diff options
author | Narumol Prangnawarat <narumol.prangnawarat@arm.com> | 2019-05-30 16:47:12 +0100 |
---|---|---|
committer | Narumol Prangnawarat <narumol.prangnawarat@arm.com> | 2019-05-31 10:04:02 +0000 |
commit | 01961a7df1c4357981a33b9c1eb80fb51888a8fa (patch) | |
tree | 4ead27fb4bcc24cc54b59c8ea5ab56ca0f7e028a /src/backends/neon/workloads | |
parent | 20ec2497c4059e39f43a38ceb2ba99f1a7b760f1 (diff) | |
download | armnn-01961a7df1c4357981a33b9c1eb80fb51888a8fa.tar.gz |
IVGCVSW-3148 Add Neon backend support for Dequantize
* Add NeonDequantizeWorkload
* Add IsDequantizeSupported to call validate from ACL function
* Add CreateDequantize to NeonWorkloadFactory
* Unit tests
Signed-off-by: Narumol Prangnawarat <narumol.prangnawarat@arm.com>
Change-Id: I96a216ef78cc3f6a57aa439a16ae6aafd783ff93
Diffstat (limited to 'src/backends/neon/workloads')
-rw-r--r-- | src/backends/neon/workloads/CMakeLists.txt | 2 | ||||
-rw-r--r-- | src/backends/neon/workloads/NeonDequantizeWorkload.cpp | 48 | ||||
-rw-r--r-- | src/backends/neon/workloads/NeonDequantizeWorkload.hpp | 31 | ||||
-rw-r--r-- | src/backends/neon/workloads/NeonWorkloads.hpp | 1 |
4 files changed, 82 insertions, 0 deletions
```diff
diff --git a/src/backends/neon/workloads/CMakeLists.txt b/src/backends/neon/workloads/CMakeLists.txt
index b7638208d1..f6568e1f7e 100644
--- a/src/backends/neon/workloads/CMakeLists.txt
+++ b/src/backends/neon/workloads/CMakeLists.txt
@@ -22,6 +22,8 @@ list(APPEND armnnNeonBackendWorkloads_sources
     NeonConvolution2dWorkload.hpp
     NeonDepthwiseConvolutionWorkload.cpp
     NeonDepthwiseConvolutionWorkload.hpp
+    NeonDequantizeWorkload.cpp
+    NeonDequantizeWorkload.hpp
     NeonFloorFloatWorkload.cpp
     NeonFloorFloatWorkload.hpp
     NeonFullyConnectedWorkload.cpp
diff --git a/src/backends/neon/workloads/NeonDequantizeWorkload.cpp b/src/backends/neon/workloads/NeonDequantizeWorkload.cpp
new file mode 100644
index 0000000000..9840b48dd2
--- /dev/null
+++ b/src/backends/neon/workloads/NeonDequantizeWorkload.cpp
@@ -0,0 +1,48 @@
+//
+// Copyright © 2017 Arm Ltd. All rights reserved.
+// SPDX-License-Identifier: MIT
+//
+
+#include "NeonDequantizeWorkload.hpp"
+
+#include "NeonWorkloadUtils.hpp"
+
+#include <aclCommon/ArmComputeTensorUtils.hpp>
+#include <backendsCommon/CpuTensorHandle.hpp>
+#include <neon/NeonTensorHandle.hpp>
+
+namespace armnn
+{
+
+using namespace armcomputetensorutils;
+
+arm_compute::Status NeonDequantizeWorkloadValidate(const TensorInfo& input,
+                                                   const TensorInfo& output)
+{
+    const arm_compute::TensorInfo aclInput = BuildArmComputeTensorInfo(input);
+    const arm_compute::TensorInfo aclOutput = BuildArmComputeTensorInfo(output);
+
+    return arm_compute::NEDequantizationLayer::validate(&aclInput, &aclOutput);
+}
+
+NeonDequantizeWorkload::NeonDequantizeWorkload(const DequantizeQueueDescriptor& descriptor, const WorkloadInfo& info)
+    : BaseWorkload<DequantizeQueueDescriptor>(descriptor, info)
+{
+    m_Data.ValidateInputsOutputs("NeonDequantizeWorkload", 1, 1);
+
+    arm_compute::ITensor& input = boost::polymorphic_downcast<INeonTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
+    arm_compute::ITensor& output = boost::polymorphic_downcast<INeonTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
+
+    m_Layer.reset(new arm_compute::NEDequantizationLayer());
+    m_Layer->configure(&input, &output);
+    m_Layer->prepare();
+}
+
+void NeonDequantizeWorkload::Execute() const
+{
+    ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonDequantizeWorkload_Execute");
+    m_Layer->run();
+}
+
+} //namespace armnn
+
diff --git a/src/backends/neon/workloads/NeonDequantizeWorkload.hpp b/src/backends/neon/workloads/NeonDequantizeWorkload.hpp
new file mode 100644
index 0000000000..a6616376e7
--- /dev/null
+++ b/src/backends/neon/workloads/NeonDequantizeWorkload.hpp
@@ -0,0 +1,31 @@
+//
+// Copyright © 2017 Arm Ltd. All rights reserved.
+// SPDX-License-Identifier: MIT
+//
+
+#pragma once
+
+#include <backendsCommon/Workload.hpp>
+
+#include <arm_compute/runtime/NEON/NEFunctions.h>
+
+#include <functional>
+
+namespace armnn
+{
+
+arm_compute::Status NeonDequantizeWorkloadValidate(const TensorInfo& input,
+                                                   const TensorInfo& output);
+
+class NeonDequantizeWorkload : public BaseWorkload<DequantizeQueueDescriptor>
+{
+public:
+    NeonDequantizeWorkload(const DequantizeQueueDescriptor& descriptor, const WorkloadInfo& info);
+
+    void Execute() const override;
+
+private:
+    mutable std::unique_ptr<arm_compute::NEDequantizationLayer> m_Layer;
+};
+
+} //namespace armnn
diff --git a/src/backends/neon/workloads/NeonWorkloads.hpp b/src/backends/neon/workloads/NeonWorkloads.hpp
index 8ad70d7095..ecd50c9d02 100644
--- a/src/backends/neon/workloads/NeonWorkloads.hpp
+++ b/src/backends/neon/workloads/NeonWorkloads.hpp
@@ -12,6 +12,7 @@
 #include "NeonConvertFp32ToFp16Workload.hpp"
 #include "NeonConvolution2dWorkload.hpp"
 #include "NeonDepthwiseConvolutionWorkload.hpp"
+#include "NeonDequantizeWorkload.hpp"
 #include "NeonFloorFloatWorkload.hpp"
 #include "NeonFullyConnectedWorkload.hpp"
 #include "NeonGreaterWorkload.hpp"
```