diff options
author | Giorgio Arena <giorgio.arena@arm.com> | 2018-07-02 15:29:57 +0100 |
---|---|---|
committer | Anthony Barbier <anthony.barbier@arm.com> | 2018-11-02 16:54:54 +0000 |
commit | eff8d95991205e874091576e2d225f63246dd0bb (patch) | |
tree | a0dc2ab5544c7dbc68d7e2af3ae72101b8247e6a /src/core/CL/CLKernelLibrary.cpp | |
parent | 74b671bc2da803ef60bcdec62923943960eb3acd (diff) | |
download | ComputeLibrary-eff8d95991205e874091576e2d225f63246dd0bb.tar.gz |
COMPMID-1316 Using 8 bit dot product instruction in CLDepthWiseConvolution with QASYMM8
Change-Id: I3fc37bdceaae8b4b1effa51129b71bf352388564
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/138374
Tested-by: Jenkins <bsgcomp@arm.com>
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Diffstat (limited to 'src/core/CL/CLKernelLibrary.cpp')
-rw-r--r-- | src/core/CL/CLKernelLibrary.cpp | 9 |
1 file changed, 8 insertions, 1 deletion
```diff
diff --git a/src/core/CL/CLKernelLibrary.cpp b/src/core/CL/CLKernelLibrary.cpp
index 475352456c..64519ff459 100644
--- a/src/core/CL/CLKernelLibrary.cpp
+++ b/src/core/CL/CLKernelLibrary.cpp
@@ -200,8 +200,10 @@ const std::map<std::string, std::string> CLKernelLibrary::_kernel_program_map =
     { "depthwise_convolution_3x3_nhwc", "depthwise_convolution.cl" },
     { "depthwise_convolution_3x3_nhwc_stride1", "depthwise_convolution.cl" },
     { "depthwise_convolution_3x3_quantized_nchw", "depthwise_convolution_quantized.cl" },
+    { "depthwise_convolution_3x3_quantized_nhwc", "depthwise_convolution_quantized.cl" },
     { "depthwise_convolution_3x3_quantized_nhwc_stride1", "depthwise_convolution_quantized.cl" },
-    { "depthwise_convolution_3x3_quantized_nhwc_stride2", "depthwise_convolution_quantized.cl" },
+    { "depthwise_convolution_3x3_quantized_dot8_nchw", "depthwise_convolution_quantized.cl" },
+    { "depthwise_convolution_3x3_quantized_dot8_nhwc_stride1", "depthwise_convolution_quantized.cl" },
     { "depthwise_convolution_3x3_stridex1_stridey1_bifrost_f16", "depthwise_convolution.cl" },
     { "depthwise_convolution_3x3_stridex2_stridey2_bifrost_f16", "depthwise_convolution.cl" },
     { "depthwise_convolution_3x3_stridex1_stridey1_bifrost_f32", "depthwise_convolution.cl" },
@@ -810,6 +812,11 @@ Kernel CLKernelLibrary::create_kernel(const std::string &kernel_name, const Stri
         concat_str += " -DARM_COMPUTE_OPENCL_DOT8_ENABLED=1 ";
     }
 
+    if(dot8_acc_supported(_device))
+    {
+        concat_str += " -DARM_COMPUTE_OPENCL_DOT8_ACC_ENABLED=1 ";
+    }
+
     if(get_cl_version(_device) == CLVersion::CL20)
     {
         concat_str += " -cl-std=CL2.0 ";
```