From 70eb53b09adf57cc6ff7435c795e65a4f4697f67 Mon Sep 17 00:00:00 2001 From: Georgios Pinitas Date: Wed, 6 Jan 2021 19:42:21 +0000 Subject: Make CpuFloorKernel kernel stateless - Rename NEFloorKernel to CpuFloorKernel to accommodate new ISA implementations - Remove state and instead pass tensors to operate during run - Add member function to generate an execution window given an input and output tensor description Signed-off-by: Georgios Pinitas Change-Id: I9240b8ec534589c0f15c354f771f1ac5d7010c3b Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4773 Comments-Addressed: Arm Jenkins Tested-by: Arm Jenkins Reviewed-by: Michalis Spyrou --- src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp | 13 ++++++------- 1 file changed, 6 insertions(+), 7 deletions(-) (limited to 'src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp') diff --git a/src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp b/src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp index ed1cb6fca4..fdd2aabf60 100644 --- a/src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp +++ b/src/core/NEON/kernels/NEElementwiseUnaryKernel.cpp @@ -31,7 +31,6 @@ #include "src/core/NEON/kernels/elementwise/impl/elementwise_unary_list.h" #include "src/core/SVE/kernels/elementwise/impl/elementwise_unary_list.h" #include "src/core/common/Registrars.h" -#include "src/core/common/StdTypes.h" #include "src/core/helpers/AutoConfiguration.h" #include "src/core/helpers/WindowHelpers.h" #include "support/ToolchainSupport.h" @@ -55,35 +54,35 @@ static const ElementwiseUnaryKernel available_kernels[] = { "fp32_sve_elementwise_unary", [](DataType dt) { return dt == DataType::F32; }, - REGISTER_FP32_SVE(arm_compute::cpu::elementwise_sve_op), + REGISTER_FP32_SVE(arm_compute::cpu::elementwise_sve_op), }, { "fp16_sve_elementwise_unary", [](DataType dt) { return dt == DataType::F16; }, - REGISTER_FP16_SVE(arm_compute::cpu::elementwise_sve_op), + REGISTER_FP16_SVE(arm_compute::cpu::elementwise_sve_op<__fp16>), }, { 
"s32_sve_elementwise_unary", [](DataType dt) { return dt == DataType::S32; }, - REGISTER_INTEGER_SVE(arm_compute::cpu::elementwise_sve_op), + REGISTER_INTEGER_SVE(arm_compute::cpu::elementwise_sve_op), }, #endif // defined(__ARM_FEATURE_SVE) { "fp32_neon_elementwise_unary", [](DataType dt) { return dt == DataType::F32; }, - REGISTER_FP32_NEON(arm_compute::cpu::elementwise_op), + REGISTER_FP32_NEON(arm_compute::cpu::elementwise_op), }, #if defined(__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) { "fp16_neon_elementwise_unary", [](DataType dt) { return dt == DataType::F16; }, - REGISTER_FP32_NEON(arm_compute::cpu::elementwise_op), + REGISTER_FP32_NEON(arm_compute::cpu::elementwise_op<__fp16>), }, #endif // defined(__ARM_FEATURE_FP16_VECTOR_ARITHMETIC) { "s32_neon_elementwise_unary", [](DataType dt) { return dt == DataType::S32; }, - REGISTER_INTEGER_NEON(arm_compute::cpu::elementwise_op), + REGISTER_INTEGER_NEON(arm_compute::cpu::elementwise_op), }, }; -- cgit v1.2.1