diff options
author | SiCong Li <sicong.li@arm.com> | 2020-10-28 14:19:28 +0000 |
---|---|---|
committer | SiCong Li <sicong.li@arm.com> | 2020-11-05 11:20:58 +0000 |
commit | 4abc9d1a842e90162afe5349e3d51298fa0b8af4 (patch) | |
tree | 9e6745f75b39cdcc8f15fc56c260ad5eded23d36 /src/core/CL/CLKernelLibrary.cpp | |
parent | 770dfeb04b6fd89afde2005bd46caa6ff0858f3e (diff) | |
download | ComputeLibrary-4abc9d1a842e90162afe5349e3d51298fa0b8af4.tar.gz |
COMPMID-3730 Remove padding from CLGEMMMatrixMultiplyKernel Patch1
* Remove default definition for STORE_BLOCK_BOUNDARY_AWARE to avoid elusive bugs
* Clean up gemm_mm_interleaved* and gemm_mm_floating_point* kernels
* Relocate these kernels to gemm_v1.cl to avoid clashing with new kernels
* Rename compile-time arguments to conform with the established
terminology (MNKB), and to facilitate the use of STORE_BLOCK_BOUNDARY_AWARE
Change-Id: Ia85c746b2536cad87257a79685b459b5d2f9a1be
Signed-off-by: SiCong Li <sicong.li@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4329
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/CL/CLKernelLibrary.cpp')
-rw-r--r-- | src/core/CL/CLKernelLibrary.cpp | 24 |
1 files changed, 14 insertions, 10 deletions
diff --git a/src/core/CL/CLKernelLibrary.cpp b/src/core/CL/CLKernelLibrary.cpp index 8c5607eebc..33f0da0aa1 100644 --- a/src/core/CL/CLKernelLibrary.cpp +++ b/src/core/CL/CLKernelLibrary.cpp @@ -206,16 +206,16 @@ const std::map<std::string, std::string> CLKernelLibrary::_kernel_program_map = { "gemm_ma_f32", "gemm.cl" }, { "gemm_mv", "gemv.cl" }, { "gemm_mv_quantized", "gemv.cl" }, - { "gemm_mm_interleaved_transposed_f16", "gemm.cl" }, - { "gemm_mm_interleaved_transposed_f16_acc32", "gemm.cl" }, - { "gemm_mm_interleaved_transposed_f16_bifrost", "gemm.cl" }, - { "gemm_mm_interleaved_transposed_f32", "gemm.cl" }, - { "gemm_mm_interleaved_transposed_f32_bifrost", "gemm.cl" }, - { "gemm_mm_floating_point", "gemm.cl" }, - { "gemm_mm_floating_point_f16_bifrost", "gemm.cl" }, - { "gemm_mm_floating_point_f16_bifrost_acc32", "gemm.cl" }, - { "gemm_mm_floating_point_f32_bifrost", "gemm.cl" }, - { "gemm_mm_floating_point_f32_bifrost_1000", "gemm.cl" }, + { "gemm_mm_interleaved_transposed_f16", "gemm_v1.cl" }, + { "gemm_mm_interleaved_transposed_f16_acc32", "gemm_v1.cl" }, + { "gemm_mm_interleaved_transposed_f16_bifrost", "gemm_v1.cl" }, + { "gemm_mm_interleaved_transposed_f32", "gemm_v1.cl" }, + { "gemm_mm_interleaved_transposed_f32_bifrost", "gemm_v1.cl" }, + { "gemm_mm_floating_point", "gemm_v1.cl" }, + { "gemm_mm_floating_point_f16_bifrost", "gemm_v1.cl" }, + { "gemm_mm_floating_point_f16_bifrost_acc32", "gemm_v1.cl" }, + { "gemm_mm_floating_point_f32_bifrost", "gemm_v1.cl" }, + { "gemm_mm_floating_point_f32_bifrost_1000", "gemm_v1.cl" }, { "gemm_mm_native", "gemm.cl" }, { "gemm_mm_reshaped_lhs_nt_rhs_t", "gemm.cl" }, { "gemm_mm_reshaped_lhs_nt_rhs_t_texture", "gemm.cl" }, @@ -690,6 +690,10 @@ const std::map<std::string, std::string> CLKernelLibrary::_program_source_map = #include "./cl_kernels/gemm.clembed" }, { + "gemm_v1.cl", +#include "./cl_kernels/gemm_v1.clembed" + }, + { "gemmlowp.cl", #include "./cl_kernels/gemmlowp.clembed" }, |