COMPMID-2609: Enable quantization with multiplier greater than 1 on OpenCL

Change-Id: I050f1f84e214e61f7cbb0197a672b68a4940edae
Signed-off-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Reviewed-on: https://review.mlplatform.org/c/2158
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Manuel Bottini <manuel.bottini@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Giorgio Arena <giorgio.arena@arm.com>
author: Michele Di Giorgio <michele.digiorgio@arm.com> 2019-10-23 10:53:10 +0100
committer: Michele Di Giorgio <michele.digiorgio@arm.com> 2019-11-28 10:02:15 +0000
commit: 14cbfb2921990d8bf125231e350e2ac8dcd95a8b (patch)
tree: 9bec073d72c44c480c8807601889481d9b89ee7e /src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp
parent: ed7b27dd7cbdae57b880029840ad0235523848e0 (diff)
download: ComputeLibrary-14cbfb2921990d8bf125231e350e2ac8dcd95a8b.tar.gz
1 files changed, 20 insertions, 0 deletions
diff --git a/src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp b/src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp
index 3fc236eaa7..2155306d62 100644
--- a/src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp
+++ b/src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp
@@ -107,6 +107,18 @@ Status validate_arguments(const ITensorInfo *input, const ITensorInfo *weights,
         ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS(output->tensor_shape(), output_shape);
     }
 
+    if(is_data_type_quantized(input->data_type()))
+    {
+        const UniformQuantizationInfo iq_info = input->quantization_info().uniform();
+        const UniformQuantizationInfo wq_info = weights->quantization_info().uniform();
+        const UniformQuantizationInfo oq_info = (output->total_size() != 0) ? output->quantization_info().uniform() : iq_info;
+
+        float multiplier        = iq_info.scale * wq_info.scale / oq_info.scale;
+        int   output_multiplier = 0;
+        int   output_shift      = 0;
+        ARM_COMPUTE_RETURN_ON_ERROR(quantization::calculate_quantized_multiplier(multiplier, &output_multiplier, &output_shift));
+    }
+
     return Status{};
 }
 
@@ -236,6 +248,14 @@ void CLDepthwiseConvolutionLayerNativeKernel::configure(const ICLTensor *input,
         build_opts.add_option("-DOUTPUT_OFFSET=" + support::cpp11::to_string(oq_info.offset));
         build_opts.add_option_if(is_data_type_quantized_per_channel(weights->info()->data_type()), "-DPER_CHANNEL_QUANTIZATION");
 
+        // Compute non-per-channel multiplier and shift anyway to make OpenCL kernel simpler
+        float multiplier        = iq_info.scale * wq_info.scale / oq_info.scale;
+        int   output_multiplier = 0;
+        int   output_shift      = 0;
+        quantization::calculate_quantized_multiplier(multiplier, &output_multiplier, &output_shift);
+        build_opts.add_option("-DOUTPUT_MULTIPLIER=" + support::cpp11::to_string(output_multiplier));
+        build_opts.add_option("-DOUTPUT_SHIFT=" + support::cpp11::to_string(output_shift));
+
         if(dwc_info.activation_info.enabled())
         {
             const int a_val = quantize_qasymm8(dwc_info.activation_info.a(), oq_info);
author	Michele Di Giorgio <michele.digiorgio@arm.com>	2019-10-23 10:53:10 +0100
committer	Michele Di Giorgio <michele.digiorgio@arm.com>	2019-11-28 10:02:15 +0000
commit	14cbfb2921990d8bf125231e350e2ac8dcd95a8b (patch)
tree	9bec073d72c44c480c8807601889481d9b89ee7e /src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp
parent	ed7b27dd7cbdae57b880029840ad0235523848e0 (diff)
download	ComputeLibrary-14cbfb2921990d8bf125231e350e2ac8dcd95a8b.tar.gz