diff options
Diffstat (limited to 'src/backends/cl/workloads')
-rw-r--r-- | src/backends/cl/workloads/CMakeLists.txt | 2 | ||||
-rw-r--r-- | src/backends/cl/workloads/ClDequantizeWorkload.cpp | 55 | ||||
-rw-r--r-- | src/backends/cl/workloads/ClDequantizeWorkload.hpp | 28 | ||||
-rw-r--r-- | src/backends/cl/workloads/ClWorkloads.hpp | 1 |
4 files changed, 86 insertions, 0 deletions
diff --git a/src/backends/cl/workloads/CMakeLists.txt b/src/backends/cl/workloads/CMakeLists.txt index 23668c564b..c055244b1f 100644 --- a/src/backends/cl/workloads/CMakeLists.txt +++ b/src/backends/cl/workloads/CMakeLists.txt @@ -24,6 +24,8 @@ list(APPEND armnnClBackendWorkloads_sources ClConvolution2dWorkload.hpp ClDepthwiseConvolutionWorkload.cpp ClDepthwiseConvolutionWorkload.hpp + ClDequantizeWorkload.cpp + ClDequantizeWorkload.hpp ClDivisionFloatWorkload.cpp ClDivisionFloatWorkload.hpp ClFloorFloatWorkload.cpp diff --git a/src/backends/cl/workloads/ClDequantizeWorkload.cpp b/src/backends/cl/workloads/ClDequantizeWorkload.cpp new file mode 100644 index 0000000000..67a555a020 --- /dev/null +++ b/src/backends/cl/workloads/ClDequantizeWorkload.cpp @@ -0,0 +1,55 @@ +// +// Copyright © 2017 Arm Ltd. All rights reserved. +// SPDX-License-Identifier: MIT +// + +#include "ClDequantizeWorkload.hpp" +#include "ClWorkloadUtils.hpp" + +#include <aclCommon/ArmComputeTensorUtils.hpp> +#include <backendsCommon/CpuTensorHandle.hpp> + +#include <arm_compute/core/Types.h> + +#include <cl/ClLayerSupport.hpp> +#include <cl/ClTensorHandle.hpp> + +#include <boost/polymorphic_pointer_cast.hpp> + +namespace armnn +{ +using namespace armcomputetensorutils; + +arm_compute::Status ClDequantizeWorkloadValidate(const TensorInfo& input, const TensorInfo& output) +{ + const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input); + const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output); + + return arm_compute::CLDequantizationLayer::validate(&aclInputInfo, &aclOutputInfo); +} + +ClDequantizeWorkload::ClDequantizeWorkload(const DequantizeQueueDescriptor& descriptor, + const WorkloadInfo& workloadInfo) + : BaseWorkload<DequantizeQueueDescriptor>(descriptor, workloadInfo) +{ + arm_compute::ICLTensor& input = boost::polymorphic_pointer_downcast<IClTensorHandle>( + m_Data.m_Inputs[0])->GetTensor(); + + arm_compute::ICLTensor& output = boost::polymorphic_pointer_downcast<IClTensorHandle>( + m_Data.m_Outputs[0])->GetTensor(); + + m_Layer.reset(new arm_compute::CLDequantizationLayer()); + m_Layer->configure(&input, &output); + m_Layer->prepare(); +} + +void ClDequantizeWorkload::Execute() const +{ + if (m_Layer) + { + ARMNN_SCOPED_PROFILING_EVENT_CL("ClDequantizeWorkload_Execute"); + m_Layer->run(); + } +} + +} // namespace armnn diff --git a/src/backends/cl/workloads/ClDequantizeWorkload.hpp b/src/backends/cl/workloads/ClDequantizeWorkload.hpp new file mode 100644 index 0000000000..6e61da2ebf --- /dev/null +++ b/src/backends/cl/workloads/ClDequantizeWorkload.hpp @@ -0,0 +1,28 @@ +// +// Copyright © 2017 Arm Ltd. All rights reserved. +// SPDX-License-Identifier: MIT +// + +#pragma once + +#include <backendsCommon/Workload.hpp> + +#include <arm_compute/runtime/CL/functions/CLDequantizationLayer.h> + +namespace armnn +{ + +arm_compute::Status ClDequantizeWorkloadValidate(const TensorInfo& input, const TensorInfo& output); + +class ClDequantizeWorkload : public BaseWorkload<DequantizeQueueDescriptor> +{ +public: + ClDequantizeWorkload(const DequantizeQueueDescriptor& descriptor, const WorkloadInfo& workloadInfo); + + void Execute() const override; + +private: + mutable std::unique_ptr<arm_compute::CLDequantizationLayer> m_Layer; +}; + +} // namespace armnn
\ No newline at end of file diff --git a/src/backends/cl/workloads/ClWorkloads.hpp b/src/backends/cl/workloads/ClWorkloads.hpp index 0060412770..b836781166 100644 --- a/src/backends/cl/workloads/ClWorkloads.hpp +++ b/src/backends/cl/workloads/ClWorkloads.hpp @@ -11,6 +11,7 @@ #include "ClBatchToSpaceNdWorkload.hpp" #include "ClConvolution2dWorkload.hpp" #include "ClDepthwiseConvolutionWorkload.hpp" +#include "ClDequantizeWorkload.hpp" #include "ClDivisionFloatWorkload.hpp" #include "ClFloorFloatWorkload.hpp" #include "ClFullyConnectedWorkload.hpp" |