diff options
Diffstat (limited to 'arm_compute/core')
-rw-r--r-- | arm_compute/core/CL/kernels/CLActivationLayerKernel.h | 34 | ||||
-rw-r--r-- | arm_compute/core/NEON/kernels/NEActivationLayerKernel.h | 17 |
2 files changed, 39 insertions, 12 deletions
diff --git a/arm_compute/core/CL/kernels/CLActivationLayerKernel.h b/arm_compute/core/CL/kernels/CLActivationLayerKernel.h index 490e70544b..df22574de8 100644 --- a/arm_compute/core/CL/kernels/CLActivationLayerKernel.h +++ b/arm_compute/core/CL/kernels/CLActivationLayerKernel.h @@ -24,23 +24,45 @@ #ifndef __ARM_COMPUTE_CLACTIVATIONLAYERKERNEL_H__ #define __ARM_COMPUTE_CLACTIVATIONLAYERKERNEL_H__ -#include "arm_compute/core/CL/ICLSimple3DKernel.h" +#include "arm_compute/core/CL/ICLKernel.h" namespace arm_compute { class ICLTensor; /** Interface for the activation layer kernel. */ -class CLActivationLayerKernel : public ICLSimple3DKernel +class CLActivationLayerKernel : public ICLKernel { public: + /** Default constructor */ + CLActivationLayerKernel(); + /** Prevent instances of this class from being copied (As this class contains pointers) */ + CLActivationLayerKernel(const CLActivationLayerKernel &) = delete; + /** Prevent instances of this class from being copied (As this class contains pointers) */ + CLActivationLayerKernel &operator=(const CLActivationLayerKernel &) = delete; + /** Allow instances of this class to be moved */ + CLActivationLayerKernel(CLActivationLayerKernel &&) = default; + /** Allow instances of this class to be moved */ + CLActivationLayerKernel &operator=(CLActivationLayerKernel &&) = default; + /** Default destructor */ + ~CLActivationLayerKernel() = default; /** Set the input and output tensor. * - * @param[in] input Source tensor. Data types supported: F16, F32, U16, S16. - * @param[out] output Destination tensor. Data type should match the input data type. - * @param[in] act_info Activation layer information. + * @note If the output tensor is a nullptr, the activation function will be performed in-place + * + * @param[in, out] input Source tensor. In case of @p output tensor = nullptr, this tensor will store the result + * of the activation function. Data types supported: F16/F32. + * @param[out] output Destination tensor. Data type should match the input data type. + * @param[in] act_info Activation layer information. */ - void configure(const ICLTensor *input, ICLTensor *output, ActivationLayerInfo act_info); + void configure(ICLTensor *input, ICLTensor *output, ActivationLayerInfo act_info); + + // Inherited methods overridden: + void run(const Window &window, cl::CommandQueue &queue) override; + +private: + ICLTensor *_input; + ICLTensor *_output; }; } #endif /*__ARM_COMPUTE_CLACTIVATIONLAYERKERNEL_H__ */ diff --git a/arm_compute/core/NEON/kernels/NEActivationLayerKernel.h b/arm_compute/core/NEON/kernels/NEActivationLayerKernel.h index 97f92d6a1e..539bca587a 100644 --- a/arm_compute/core/NEON/kernels/NEActivationLayerKernel.h +++ b/arm_compute/core/NEON/kernels/NEActivationLayerKernel.h @@ -25,14 +25,14 @@ #define __ARM_COMPUTE_NEACTIVATIONLAYERKERNEL_H__ #include "arm_compute/core/FixedPoint.h" -#include "arm_compute/core/NEON/INESimpleKernel.h" +#include "arm_compute/core/NEON/INEKernel.h" namespace arm_compute { class ITensor; /** Interface for the activation layer kernel. */ -class NEActivationLayerKernel : public INESimpleKernel +class NEActivationLayerKernel : public INEKernel { public: /** Constructor */ @@ -47,11 +47,14 @@ public: NEActivationLayerKernel &operator=(NEActivationLayerKernel &&) = default; /** Set the input and output tensor. * - * @param[in] input Source tensor. Data types supported: QS8/F32. - * @param[out] output Destination tensor. Data type supported: same as @p input - * @param[in] activation_info Activation layer information. + * @note If the output tensor is a nullptr, the activation function will be performed in-place + * + * @param[in, out] input Source tensor. In case of @p output tensor = nullptr, this tensor will store the result + * of the activation function. Data types supported: QS8/F32. + * @param[out] output Destination tensor. Data type supported: same as @p input + * @param[in] activation_info Activation layer information. */ - void configure(const ITensor *input, ITensor *output, ActivationLayerInfo activation_info); + void configure(ITensor *input, ITensor *output, ActivationLayerInfo activation_info); // Inherited methods overridden: void run(const Window &window) override; @@ -77,6 +80,8 @@ private: typename std::enable_if<std::is_same<T, qint8_t>::value, void>::type activation(const Window &window); private: + ITensor *_input; + ITensor *_output; ActivationFunctionExecutorPtr _func; ActivationLayerInfo _act_info; }; |