Optimize int8 arithmetic addition on CPU

Avoid accessing quantization info from TensorInfo in leftover loop. Use the already available UniformQuantizationInfo instead.

Create another version of the quantize utility function which assumes RoundingPolicy::TO_NEAREST_UP. This allows us to call std::lround() and avoid some overhead.

Resolve COMPMID-4546

Signed-off-by: Giorgio Arena <giorgio.arena@arm.com>
Change-Id: Ib481a586f879b7e937e3d54ba11100d0a37ef277
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5722
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
author: Giorgio Arena <giorgio.arena@arm.com> 2021-05-26 15:32:50 +0100
committer: Giorgio Arena <giorgio.arena@arm.com> 2021-06-01 11:27:17 +0000
commit: 433ea4981675b64c44c8f47f2f4aac6bfcbfc911 (patch)
tree: 7f73bdb5f7c068bd2d6849ae615447e8ea93843f /arm_compute/core/QuantizationInfo.h
parent: b3be45759bdd0749ae3a16fe470820f0d9830ea9 (diff)
download: ComputeLibrary-433ea4981675b64c44c8f47f2f4aac6bfcbfc911.tar.gz
1 file changed, 24 insertions, 4 deletions
diff --git a/arm_compute/core/QuantizationInfo.h b/arm_compute/core/QuantizationInfo.h
index af7b8c66d8..b331f7d923 100644
--- a/arm_compute/core/QuantizationInfo.h
+++ b/arm_compute/core/QuantizationInfo.h
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2020 Arm Limited.
+ * Copyright (c) 2019-2021 Arm Limited.
  *
  * SPDX-License-Identifier: MIT
  *
@@ -24,9 +24,10 @@
 #ifndef ARM_COMPUTE_QUANTIZATION_INFO_H
 #define ARM_COMPUTE_QUANTIZATION_INFO_H
 
+#include "arm_compute/core/Error.h"
 #include "arm_compute/core/Rounding.h"
+#include "support/ToolchainSupport.h"
 #include "utils/misc/Utility.h"
-#include "arm_compute/core/Error.h"
 
 #include <cstddef>
 #include <type_traits>
@@ -216,14 +217,33 @@ struct Qasymm8QuantizationHelper
 
     /** Quantize a value given a 8-bit asymmetric quantization scheme
      *
+     * @param[in] value Value to quantize
+     * @param[in] qinfo Quantization information to use for quantizing
+     *
+     * @return Quantized value
+     */
+    static inline QUANTIZED_TYPE quantize(float value, const UniformQuantizationInfo &qinfo)
+    {
+        ARM_COMPUTE_ERROR_ON(qinfo.scale == 0);
+        const int quantized = support::cpp11::lround(value / qinfo.scale) + qinfo.offset;
+        return static_cast<QUANTIZED_TYPE>(arm_compute::utility::clamp<decltype(quantized), QUANTIZED_TYPE>(quantized));
+    }
+
+    /** Quantize a value given a 8-bit asymmetric quantization scheme using a specific rounding policy
+     *
      * @param[in] value           Value to quantize
      * @param[in] qinfo           Quantization information to use for quantizing
-     * @param[in] rounding_policy (Optional) Rounding policy to use. Default: nearest up
+     * @param[in] rounding_policy Rounding policy to use
      *
      * @return Quantized value
      */
-    static inline QUANTIZED_TYPE quantize(float value, const UniformQuantizationInfo &qinfo, RoundingPolicy rounding_policy = RoundingPolicy::TO_NEAREST_UP)
+    static inline QUANTIZED_TYPE quantize(float value, const UniformQuantizationInfo &qinfo, RoundingPolicy rounding_policy)
     {
+        if(rounding_policy == RoundingPolicy::TO_NEAREST_UP)
+        {
+            return quantize(value, qinfo);
+        }
+
         ARM_COMPUTE_ERROR_ON(qinfo.scale == 0);
         const int quantized = arm_compute::round(value / qinfo.scale, rounding_policy) + qinfo.offset;
         return static_cast<QUANTIZED_TYPE>(arm_compute::utility::clamp<decltype(quantized), QUANTIZED_TYPE>(quantized));
author	Giorgio Arena <giorgio.arena@arm.com>	2021-05-26 15:32:50 +0100
committer	Giorgio Arena <giorgio.arena@arm.com>	2021-06-01 11:27:17 +0000
commit	433ea4981675b64c44c8f47f2f4aac6bfcbfc911 (patch)
tree	7f73bdb5f7c068bd2d6849ae615447e8ea93843f /arm_compute/core/QuantizationInfo.h
parent	b3be45759bdd0749ae3a16fe470820f0d9830ea9 (diff)
download	ComputeLibrary-433ea4981675b64c44c8f47f2f4aac6bfcbfc911.tar.gz