From d7154dbf0f4a347f2f35f2475a893f1631c5ee1a Mon Sep 17 00:00:00 2001
From: Dana Zlotnik
Date: Wed, 10 Nov 2021 11:50:58 +0200
Subject: Implement 1D Adaptive Workload Splitting in CPPScheduler

Resolves COMPMID-4649

Change-Id: I941d2f8a40737ff05c49f6695a42884731ef2dc9
Signed-off-by: Dana Zlotnik
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/6656
Tested-by: Arm Jenkins
Reviewed-by: SiCong Li
Comments-Addressed: Arm Jenkins
---
 src/core/NEON/kernels/NEPadLayerKernel.cpp | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

(limited to 'src/core/NEON/kernels/NEPadLayerKernel.cpp')

diff --git a/src/core/NEON/kernels/NEPadLayerKernel.cpp b/src/core/NEON/kernels/NEPadLayerKernel.cpp
index 60986812be..2e5e9f76be 100644
--- a/src/core/NEON/kernels/NEPadLayerKernel.cpp
+++ b/src/core/NEON/kernels/NEPadLayerKernel.cpp
@@ -261,9 +261,16 @@ void NEPadLayerKernel::run(const Window &window, const ThreadInfo &info)
 
 size_t NEPadLayerKernel::get_mws(const CPUInfo &platform, size_t thread_count) const
 {
-    ARM_COMPUTE_UNUSED(platform, thread_count);
-
-    return ICPPKernel::small_network_mws;
+    ARM_COMPUTE_UNUSED(thread_count);
+    // Tuning results that gave optimized results in performance investigation
+    if (platform.get_cpu_model() == CPUModel::A73 )
+    {
+        return 10240;
+    }
+    else
+    {
+        return 9216;
+    }
 }
 
 } // namespace arm_compute
-- 
cgit v1.2.1