aboutsummaryrefslogtreecommitdiff
path: root/src/core/CL/CLKernelLibrary.cpp
diff options
context:
space:
mode:
author Giorgio Arena <giorgio.arena@arm.com> 2018-07-02 15:29:57 +0100
committer Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:54:54 +0000
commit eff8d95991205e874091576e2d225f63246dd0bb (patch)
tree a0dc2ab5544c7dbc68d7e2af3ae72101b8247e6a /src/core/CL/CLKernelLibrary.cpp
parent 74b671bc2da803ef60bcdec62923943960eb3acd (diff)
download ComputeLibrary-eff8d95991205e874091576e2d225f63246dd0bb.tar.gz
COMPMID-1316 Using 8 bit dot product instruction in CLDepthWiseConvolution with QASYMM8
Change-Id: I3fc37bdceaae8b4b1effa51129b71bf352388564
Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/138374
Tested-by: Jenkins <bsgcomp@arm.com>
Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Diffstat (limited to 'src/core/CL/CLKernelLibrary.cpp')
-rw-r--r-- src/core/CL/CLKernelLibrary.cpp 9
1 files changed, 8 insertions, 1 deletions
diff --git a/src/core/CL/CLKernelLibrary.cpp b/src/core/CL/CLKernelLibrary.cpp
index 475352456c..64519ff459 100644
--- a/src/core/CL/CLKernelLibrary.cpp
+++ b/src/core/CL/CLKernelLibrary.cpp
@@ -200,8 +200,10 @@ const std::map<std::string, std::string> CLKernelLibrary::_kernel_program_map =
{ "depthwise_convolution_3x3_nhwc", "depthwise_convolution.cl" },
{ "depthwise_convolution_3x3_nhwc_stride1", "depthwise_convolution.cl" },
{ "depthwise_convolution_3x3_quantized_nchw", "depthwise_convolution_quantized.cl" },
+ { "depthwise_convolution_3x3_quantized_nhwc", "depthwise_convolution_quantized.cl" },
{ "depthwise_convolution_3x3_quantized_nhwc_stride1", "depthwise_convolution_quantized.cl" },
- { "depthwise_convolution_3x3_quantized_nhwc_stride2", "depthwise_convolution_quantized.cl" },
+ { "depthwise_convolution_3x3_quantized_dot8_nchw", "depthwise_convolution_quantized.cl" },
+ { "depthwise_convolution_3x3_quantized_dot8_nhwc_stride1", "depthwise_convolution_quantized.cl" },
{ "depthwise_convolution_3x3_stridex1_stridey1_bifrost_f16", "depthwise_convolution.cl" },
{ "depthwise_convolution_3x3_stridex2_stridey2_bifrost_f16", "depthwise_convolution.cl" },
{ "depthwise_convolution_3x3_stridex1_stridey1_bifrost_f32", "depthwise_convolution.cl" },
@@ -810,6 +812,11 @@ Kernel CLKernelLibrary::create_kernel(const std::string &kernel_name, const Stri
concat_str += " -DARM_COMPUTE_OPENCL_DOT8_ENABLED=1 ";
}
+ if(dot8_acc_supported(_device))
+ {
+ concat_str += " -DARM_COMPUTE_OPENCL_DOT8_ACC_ENABLED=1 ";
+ }
+
if(get_cl_version(_device) == CLVersion::CL20)
{
concat_str += " -cl-std=CL2.0 ";