diff options
Diffstat (limited to 'src/backends/cl/workloads/ClGatherNdWorkload.hpp')
-rw-r--r-- | src/backends/cl/workloads/ClGatherNdWorkload.hpp | 42 |
1 files changed, 42 insertions, 0 deletions
diff --git a/src/backends/cl/workloads/ClGatherNdWorkload.hpp b/src/backends/cl/workloads/ClGatherNdWorkload.hpp new file mode 100644 index 0000000000..dd30024cc7 --- /dev/null +++ b/src/backends/cl/workloads/ClGatherNdWorkload.hpp @@ -0,0 +1,42 @@ +// +// Copyright © 2022 Arm Ltd and Contributors. All rights reserved. +// SPDX-License-Identifier: MIT +// + +#pragma once + +#include "ClBaseWorkload.hpp" + +#include "arm_compute/runtime/Tensor.h" +#include "arm_compute/runtime/CL/functions/CLGather.h" +#include "arm_compute/runtime/CL/functions/CLPixelWiseMultiplication.h" +#include "arm_compute/runtime/CL/functions/CLReductionOperation.h" +#include "arm_compute/runtime/CL/functions/CLReshapeLayer.h" + +namespace armnn +{ +arm_compute::Status ClGatherNdWorkloadValidate(const TensorInfo& params, + const TensorInfo& indices, + const TensorInfo& output); + +class ClGatherNdWorkload : public ClBaseWorkload<GatherNdQueueDescriptor> +{ +public: + ClGatherNdWorkload(const GatherNdQueueDescriptor& descriptor, + const WorkloadInfo& info, + const arm_compute::CLCompileContext& clCompileContext); + virtual void Execute() const override; + +private: + arm_compute::CLTensor m_FlattenedCoeff; + arm_compute::CLTensor m_OutputMul; + arm_compute::CLTensor m_FlattenedIndices; + arm_compute::CLTensor m_OutputGather; + + mutable arm_compute::CLPixelWiseMultiplication m_MulLayer; + mutable arm_compute::CLReductionOperation m_ReduceSumLayer; + mutable arm_compute::CLGather m_GatherLayer; + mutable arm_compute::CLReshapeLayer m_ReshapeLayer; +}; + +} //namespace armnn
\ No newline at end of file |