aboutsummaryrefslogtreecommitdiff
path: root/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h
diff options
context:
space:
mode:
author: SiCong Li <sicong.li@arm.com> 2017-07-28 14:46:20 +0100
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-09-17 14:16:42 +0100
commit: c51b72fe34e6018a1807a2c78228da7beeee1750 (patch)
tree: e1c969d6a54ae2561f8d4c6c35fd2534785f09b3 /arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h
parent: 572ade736ab344a62afa7da214cd9407fe53a281 (diff)
download: ComputeLibrary-c51b72fe34e6018a1807a2c78228da7beeee1750.tar.gz
COMPMID-355 Implement CL DirectConvolution1x1
* Add FP16 to validation tests.
* Complete benchmark tests for CL and NEON Direct Convolution.

Change-Id: Ie73d8580832372db01b82b39786fd9c8be560090
Reviewed-on: http://mpd-gerrit.cambridge.arm.com/82014
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com>
Diffstat (limited to 'arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h')
-rw-r--r-- arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h | 6
1 files changed, 3 insertions, 3 deletions
diff --git a/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h b/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h
index 8b43e18167..1e12ab95c1 100644
--- a/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h
+++ b/arm_compute/runtime/CL/functions/CLDirectConvolutionLayer.h
@@ -45,7 +45,7 @@ public:
*
* @param[in] input Source tensor. 3 lower dimensions represent a single input [width, height, IFM],
* while every optional dimension from 4 and above represent a batch of inputs.
- * Data types supported: F32.
+ * Data types supported: F16, F32.
* @param[in] weights Weights tensor. Weights are 4D tensor with dimensions [kernel_x, kernel_y, IFM, OFM]. Data type supported:Same as @p input.
* @param[in] biases Biases tensor. Shared biases supported. Biases are 1D tensor with dimensions [OFM]. Data type supported:Same as @p input.
* @param[out] output Destination tensor. 3 lower dimensions represent a single output [width, height, OFM], while the rest represent batch of outputs.
@@ -58,8 +58,8 @@ public:
void run() override;
private:
- CLDirectConvolutionLayer3x3Kernel _direct_conv_kernel;
- CLFillBorderKernel _input_border_handler;
+ CLDirectConvolutionLayerKernel _direct_conv_kernel;
+ CLFillBorderKernel _input_border_handler;
};
}
#endif /* __ARM_COMPUTE_CLDIRECTCONVOLUTIONLAYER_H__ */