about | summary | refs | log | tree | commit | diff
path: root/src/core/CL/CLKernelLibrary.cpp
diff options
context:
space:
mode:
author: SiCong Li <sicong.li@arm.com> 2020-10-28 14:19:28 +0000
committer: SiCong Li <sicong.li@arm.com> 2020-11-05 11:20:58 +0000
commit: 4abc9d1a842e90162afe5349e3d51298fa0b8af4 (patch)
tree: 9e6745f75b39cdcc8f15fc56c260ad5eded23d36 /src/core/CL/CLKernelLibrary.cpp
parent: 770dfeb04b6fd89afde2005bd46caa6ff0858f3e (diff)
download: ComputeLibrary-4abc9d1a842e90162afe5349e3d51298fa0b8af4.tar.gz
COMPMID-3730 Remove padding from CLGEMMMatrixMultiplyKernel Patch1
* Remove default definition for STORE_BLOCK_BOUNDARY_AWARE to avoid elusive bugs
* Clean up gemm_mm_interleaved* and gemm_mm_floating_point* kernels
* Relocate to gemm_v1.cl to avoid clashing with new kernels
* Rename compile time arguments to conform with the established terminology (MNKB), and to facilitate the use of STORE_BLOCK_BOUNDARY_AWARE

Change-Id: Ia85c746b2536cad87257a79685b459b5d2f9a1be
Signed-off-by: SiCong Li <sicong.li@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4329
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/CL/CLKernelLibrary.cpp')
-rw-r--r-- src/core/CL/CLKernelLibrary.cpp 24
1 files changed, 14 insertions, 10 deletions
diff --git a/src/core/CL/CLKernelLibrary.cpp b/src/core/CL/CLKernelLibrary.cpp
index 8c5607eebc..33f0da0aa1 100644
--- a/src/core/CL/CLKernelLibrary.cpp
+++ b/src/core/CL/CLKernelLibrary.cpp
@@ -206,16 +206,16 @@ const std::map<std::string, std::string> CLKernelLibrary::_kernel_program_map =
{ "gemm_ma_f32", "gemm.cl" },
{ "gemm_mv", "gemv.cl" },
{ "gemm_mv_quantized", "gemv.cl" },
- { "gemm_mm_interleaved_transposed_f16", "gemm.cl" },
- { "gemm_mm_interleaved_transposed_f16_acc32", "gemm.cl" },
- { "gemm_mm_interleaved_transposed_f16_bifrost", "gemm.cl" },
- { "gemm_mm_interleaved_transposed_f32", "gemm.cl" },
- { "gemm_mm_interleaved_transposed_f32_bifrost", "gemm.cl" },
- { "gemm_mm_floating_point", "gemm.cl" },
- { "gemm_mm_floating_point_f16_bifrost", "gemm.cl" },
- { "gemm_mm_floating_point_f16_bifrost_acc32", "gemm.cl" },
- { "gemm_mm_floating_point_f32_bifrost", "gemm.cl" },
- { "gemm_mm_floating_point_f32_bifrost_1000", "gemm.cl" },
+ { "gemm_mm_interleaved_transposed_f16", "gemm_v1.cl" },
+ { "gemm_mm_interleaved_transposed_f16_acc32", "gemm_v1.cl" },
+ { "gemm_mm_interleaved_transposed_f16_bifrost", "gemm_v1.cl" },
+ { "gemm_mm_interleaved_transposed_f32", "gemm_v1.cl" },
+ { "gemm_mm_interleaved_transposed_f32_bifrost", "gemm_v1.cl" },
+ { "gemm_mm_floating_point", "gemm_v1.cl" },
+ { "gemm_mm_floating_point_f16_bifrost", "gemm_v1.cl" },
+ { "gemm_mm_floating_point_f16_bifrost_acc32", "gemm_v1.cl" },
+ { "gemm_mm_floating_point_f32_bifrost", "gemm_v1.cl" },
+ { "gemm_mm_floating_point_f32_bifrost_1000", "gemm_v1.cl" },
{ "gemm_mm_native", "gemm.cl" },
{ "gemm_mm_reshaped_lhs_nt_rhs_t", "gemm.cl" },
{ "gemm_mm_reshaped_lhs_nt_rhs_t_texture", "gemm.cl" },
@@ -690,6 +690,10 @@ const std::map<std::string, std::string> CLKernelLibrary::_program_source_map =
#include "./cl_kernels/gemm.clembed"
},
{
+ "gemm_v1.cl",
+#include "./cl_kernels/gemm_v1.clembed"
+ },
+ {
"gemmlowp.cl",
#include "./cl_kernels/gemmlowp.clembed"
},