COMPMID-661: QASYMM8 support for fully connected layer.

Change-Id: I70e04d3a175ba366432ada98e9ca893c9f81b260 Reviewed-on: https://eu-gerrit-1.euhpc.arm.com/111094 Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com> Tested-by: BSG Visual Compute Jenkins server to access repositories on http://mpd-gerrit.cambridge.arm.com <bsgcomp@arm.com> Reviewed-by: Anthony Barbier <anthony.barbier@arm.com>
author: Georgios Pinitas <georgios.pinitas@arm.com> 2017-11-29 11:06:49 +0000
committer: Anthony Barbier <anthony.barbier@arm.com> 2018-11-02 16:41:58 +0000
commit: 45bcc3a1c287a208098ae99288273a5129ddd5eb (patch)
tree: f4f957dbc76f8e8e9a4871b16652e1033bcd4c73 /src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp
parent: 303be90ee1f03f75309b421297ba16428ea98ea5 (diff)
download: ComputeLibrary-45bcc3a1c287a208098ae99288273a5129ddd5eb.tar.gz
1 files changed, 16 insertions, 15 deletions
diff --git a/src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp b/src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp
index 96919fe3cb..d49aed3171 100644
--- a/src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp
+++ b/src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp
@@ -62,9 +62,6 @@ void CLGEMMLowpOffsetContributionKernel::configure(ICLTensor *mm_result, const I
         ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(vector_sum_col, 1, DataType::S32);
         ARM_COMPUTE_ERROR_ON(vector_sum_col->info()->dimension(0) != mm_result->info()->dimension(0));
 
-        TensorShape vector_sum_col_shape = vector_sum_col->info()->tensor_shape();
-        vector_sum_col_shape.collapse(1);
-
         build_opts.add_option("-DA_OFFSET=" + support::cpp11::to_string(a_offset));
     }
 
@@ -74,21 +71,25 @@ void CLGEMMLowpOffsetContributionKernel::configure(ICLTensor *mm_result, const I
         ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(vector_sum_row, 1, DataType::S32);
         ARM_COMPUTE_ERROR_ON(vector_sum_row->info()->dimension(0) != mm_result->info()->dimension(1));
 
-        TensorShape output_shape         = mm_result->info()->tensor_shape();
-        TensorShape vector_sum_row_shape = vector_sum_row->info()->tensor_shape();
-        vector_sum_row_shape.collapse(1);
-        output_shape.collapse(2);
+        // Validate batches
+        TensorShape output_shape = mm_result->info()->tensor_shape();
+        if(output_shape.num_dimensions() > 1)
+        {
+            TensorShape vector_sum_row_shape = vector_sum_row->info()->tensor_shape();
+            vector_sum_row_shape.collapse_from(1);
+            output_shape.collapse_from(2);
 
-        ARM_COMPUTE_ERROR_ON_MSG(vector_sum_row_shape[1] != output_shape[2], "mm_result tensor must have the same number of batches of output tensor");
+            ARM_COMPUTE_ERROR_ON_MSG(vector_sum_row_shape[1] != output_shape[2], "mm_result tensor must have the same number of batches of output tensor");
 
-        if(a_offset != 0)
-        {
-            TensorShape vector_sum_col_shape = vector_sum_col->info()->tensor_shape();
-            vector_sum_col_shape.collapse(1);
+            if(a_offset != 0)
+            {
+                TensorShape vector_sum_col_shape = vector_sum_col->info()->tensor_shape();
+                vector_sum_col_shape.collapse_from(1);
 
-            ARM_COMPUTE_ERROR_ON_MSG(vector_sum_col_shape[1] != 1
-                                     && vector_sum_col_shape[1] != vector_sum_row_shape[1],
-                                     "vector_sum_col tensor must have the same number of batches of vector_sum_row_shape or the number of batches must be set to 1");
+                ARM_COMPUTE_ERROR_ON_MSG(vector_sum_col_shape[1] != 1
+                                         && vector_sum_col_shape[1] != vector_sum_row_shape[1],
+                                         "vector_sum_col tensor must have the same number of batches of vector_sum_row_shape or the number of batches must be set to 1");
+            }
         }
 
         build_opts.add_option("-DB_OFFSET=" + support::cpp11::to_string(b_offset));
author	Georgios Pinitas <georgios.pinitas@arm.com>	2017-11-29 11:06:49 +0000
committer	Anthony Barbier <anthony.barbier@arm.com>	2018-11-02 16:41:58 +0000
commit	45bcc3a1c287a208098ae99288273a5129ddd5eb (patch)
tree	f4f957dbc76f8e8e9a4871b16652e1033bcd4c73 /src/core/CL/kernels/CLGEMMLowpOffsetContributionKernel.cpp
parent	303be90ee1f03f75309b421297ba16428ea98ea5 (diff)
download	ComputeLibrary-45bcc3a1c287a208098ae99288273a5129ddd5eb.tar.gz