From c51b72fe34e6018a1807a2c78228da7beeee1750 Mon Sep 17 00:00:00 2001 From: SiCong Li Date: Fri, 28 Jul 2017 14:46:20 +0100 Subject: COMPMID-355 Implement CL DirectConvolution1x1 * Add FP16 to validation tests. * Complete benchmark tests for CL and NEON Direct Convolution. Change-Id: Ie73d8580832372db01b82b39786fd9c8be560090 Reviewed-on: http://mpd-gerrit.cambridge.arm.com/82014 Reviewed-by: Anthony Barbier Tested-by: Kaizen --- arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) (limited to 'arm_compute/runtime') diff --git a/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h b/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h index 8b43e18167..1e12ab95c1 100644 --- a/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h +++ b/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h @@ -45,7 +45,7 @@ public: * * @param[in] input Source tensor. 3 lower dimensions represent a single input [width, height, IFM], * while every optional dimension from 4 and above represent a batch of inputs. - * Data types supported: F32. + * Data types supported: F16, F32. * @param[in] weights Weights tensor. Weights are 4D tensor with dimensions [kernel_x, kernel_y, IFM, OFM]. Data type supported:Same as @p input. * @param[in] biases Biases tensor. Shared biases supported. Biases are 1D tensor with dimensions [OFM]. Data type supported:Same as @p input. * @param[out] output Destination tensor. 3 lower dimensions represent a single output [width, height, OFM], while the rest represent batch of outputs. @@ -58,8 +58,8 @@ public: void run() override; private: - CLDirectConvolutionLayer3x3Kernel _direct_conv_kernel; - CLFillBorderKernel _input_border_handler; + CLDirectConvolutionLayerKernel _direct_conv_kernel; + CLFillBorderKernel _input_border_handler; }; } #endif /* __ARM_COMPUTE_CLDIRECTCONVOLUTIONLAYER_H__ */ -- cgit v1.2.1