aboutsummaryrefslogtreecommitdiff
path: root/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
diff options
context:
space:
mode:
authorsteniu01 <steven.niu@arm.com>2017-07-18 17:37:43 +0100
committerAnthony Barbier <anthony.barbier@arm.com>2018-09-17 14:16:42 +0100
commit27b386cb7596542a3296c32e41f7a5168b4d53be (patch)
tree8c4eb09de748069f4426dd012798933fadc88e03 /arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
parent1b80b6c7255e41257fed3b4dd0fa018e2eeee4c2 (diff)
downloadComputeLibrary-27b386cb7596542a3296c32e41f7a5168b4d53be.tar.gz
COMPMID-355 Implement 3x3 CL direct convolution
Change-Id: I1b44dc375045964e65557f0ead57a7c12d6bf097 Reviewed-on: http://mpd-gerrit.cambridge.arm.com/81418 Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com> Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Diffstat (limited to 'arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h')
-rw-r--r--arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h21
1 files changed, 11 insertions, 10 deletions
diff --git a/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h b/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
index d726071606..5612e1ae62 100644
--- a/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
+++ b/arm_compute/core/NEON/kernels/NEDirectConvolutionLayerKernel.h
@@ -46,16 +46,17 @@ public:
NEDirectConvolutionLayerKernel &operator=(NEDirectConvolutionLayerKernel &&) = default;
/** Default destructor */
~NEDirectConvolutionLayerKernel() = default;
- /** Set the input, weights and output tensors.
- *
- * @param[in] input Input tensor. Data types supported: QS8/F32.
- * @param[in] weights Set of kernels to convolve the input volume.
- * The 3rd dimension must be the same as the input's volume 3rd dimension.
- * Data type supported: Same as @p input.
- * @param[out] output Output tensor.
- * The 3rd dimensions must be equal to the 4th dimension of the @p kernels tensor. Data types supported: Same as @p input.
- * @param[in] conv_info Contains padding and stride information described in @ref PadStrideInfo.
- */
+ /** Set the input, weights, and output tensors.
+ *
+ * @param[in] input The input tensor to convolve. The 3 lower dimensions represent a single input [width, height, IFM],
+ * while every optional dimension from 4 and above represents a batch of inputs. Data types supported: QS8/F32.
+ * @param[in] weights Weights tensor. Weights are a 4D tensor with dimensions [kernel_x, kernel_y, IFM, OFM].
+ * The 3rd dimension must be the same as the input's volume 3rd dimension.
+ * Data type supported: Same as @p input.
+ * @param[out] output Output tensor.
+ * The 3rd dimension must be equal to the 4th dimension of the @p weights tensor. Data types supported: Same as @p input.
+ * @param[in] conv_info Contains padding and stride information described in @ref PadStrideInfo.
+ */
void configure(const ITensor *input, const ITensor *weights, ITensor *output, const PadStrideInfo &conv_info);
// Inherited methods overridden: