From 905786ea0c1abb2b8df36c56eae93a97823cace1 Mon Sep 17 00:00:00 2001 From: Milos Puzovic Date: Tue, 26 Mar 2024 14:34:30 +0000 Subject: Added new NEON fixed format fast math mode hybrid kernel with maximum height of 6 for accumulation and updated heuristics Change-Id: Ib52ea6825e164f4a8b8422eab7991b50af0b0d7c Signed-off-by: Milos Puzovic Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/11354 Tested-by: Arm Jenkins Reviewed-by: Jakub Sujak Benchmark: Arm Jenkins --- src/BUILD.bazel | 1 + 1 file changed, 1 insertion(+) (limited to 'src/BUILD.bazel') diff --git a/src/BUILD.bazel b/src/BUILD.bazel index d4a3b61836..dd19f38d6d 100644 --- a/src/BUILD.bazel +++ b/src/BUILD.bazel @@ -524,6 +524,7 @@ filegroup( "core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp", "core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp", "core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp", + "core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_6x16/generic.cpp", "core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp", "core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp", "core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp", -- cgit v1.2.1