aboutsummaryrefslogtreecommitdiff
path: root/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
diff options
context:
space:
mode:
author Manuel Bottini <manuel.bottini@arm.com> 2020-09-15 13:03:34 +0100
committer Georgios Pinitas <georgios.pinitas@arm.com> 2020-10-14 09:49:04 +0000
commit 87350f47084d2b69daa11c3b1c7eb47e02260063 (patch)
tree 9324b91dd5b154209c3af24ceec02286537ddf36 /arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
parent cbede286da8711031fb6fc56bb2e2c246a4c5455 (diff)
download ComputeLibrary-87350f47084d2b69daa11c3b1c7eb47e02260063.tar.gz
COMPMID-3144: Remove padding from NEDirectConvolutionLayerKernel
Change-Id: I22b907eebfbe037e6e1c7bf604172f4709a9cbed
Signed-off-by: Manuel Bottini <manuel.bottini@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4082
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Diffstat (limited to 'arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h')
-rw-r--r-- arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h 10
1 files changed, 9 insertions, 1 deletions
diff --git a/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h b/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
index 4cb9c90a1a..c927aff1eb 100644
--- a/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
+++ b/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2017-2019 Arm Limited.
+ * Copyright (c) 2017-2020 Arm Limited.
*
* SPDX-License-Identifier: MIT
*
@@ -86,6 +86,14 @@ public:
BorderSize border_size() const override;
private:
+ /* Template function for optimized convolution NHWC */
+ template <typename T>
+ void convolve_nhwc_optimized(const Window &window);
+
+ /* Template function for convolution NHWC */
+ template <typename T>
+ void convolve_nhwc(const Window &window);
+
const ITensor *_input;
const ITensor *_weights;
ITensor *_output;