aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Gian Marco Iodice <gianmarco.iodice@arm.com> 2019-06-13 15:58:32 +0100
committer Gian Marco Iodice <gianmarco.iodice@arm.com> 2019-06-14 09:51:57 +0000
commit 2b52add96d7eced9eec36d526b800e2bc269984f (patch)
tree b230b87c8722d4bfb4f844562d0948b95d364b7b
parent 2732cca12bac29e1515cee1db5005c73893c61b4 (diff)
download ComputeLibrary-2b52add96d7eced9eec36d526b800e2bc269984f.tar.gz
COMPMID-2405: Add lws_hint to CLGEMMLowpMatrixAReductionKernel
Change-Id: Ie194e6df5db07d37b15d735e15856bf02d441360
Signed-off-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Reviewed-on: https://review.mlplatform.org/c/1338
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
-rw-r--r-- src/core/CL/kernels/CLGEMMLowpReductionKernel.cpp | 12
1 files changed, 10 insertions, 2 deletions
diff --git a/src/core/CL/kernels/CLGEMMLowpReductionKernel.cpp b/src/core/CL/kernels/CLGEMMLowpReductionKernel.cpp
index 225c358b20..e878dbcdcd 100644
--- a/src/core/CL/kernels/CLGEMMLowpReductionKernel.cpp
+++ b/src/core/CL/kernels/CLGEMMLowpReductionKernel.cpp
@@ -1,5 +1,5 @@
/*
- * Copyright (c) 2017-2018 ARM Limited.
+ * Copyright (c) 2017-2019 ARM Limited.
*
* SPDX-License-Identifier: MIT
*
@@ -127,6 +127,14 @@ void CLGEMMLowpMatrixAReductionKernel::configure(const ICLTensor *mtx_a, ICLTens
auto win_config = validate_and_configure_window_matrix_a_reduction(_input->info(), _output->info());
ARM_COMPUTE_ERROR_THROW_ON(win_config.first);
ICLKernel::configure_internal(win_config.second);
+
+ _config_id = kernel_name;
+ _config_id += "_";
+ _config_id += support::cpp11::to_string(_input->info()->dimension(0));
+ _config_id += "_";
+ _config_id += support::cpp11::to_string(_input->info()->dimension(1));
+ _config_id += "_";
+ _config_id += support::cpp11::to_string(_input->info()->dimension(2));
}
Status CLGEMMLowpMatrixAReductionKernel::validate(const ITensorInfo *mtx_a, const ITensorInfo *vector_sum_row)
@@ -156,7 +164,7 @@ void CLGEMMLowpMatrixAReductionKernel::run(const Window &window, cl::CommandQueu
unsigned int idx = 0;
add_3D_tensor_argument(idx, _input, slice_in);
add_2D_tensor_argument(idx, _output, slice_out);
- enqueue(queue, *this, slice_out);
+ enqueue(queue, *this, slice_out, lws_hint());
}
while(collapsed.slide_window_slice_2D(slice_out));
}