diff options
Diffstat (limited to 'src/cpu/kernels')
-rw-r--r-- | src/cpu/kernels/CpuActivationKernel.cpp | 8 | ||||
-rw-r--r-- | src/cpu/kernels/CpuElementwiseUnaryKernel.cpp | 6 | ||||
-rw-r--r-- | src/cpu/kernels/activation/generic/sve2/lut.cpp (renamed from src/cpu/kernels/activation/generic/sve/lut.cpp) | 4 | ||||
-rw-r--r-- | src/cpu/kernels/activation/list.h | 4 | ||||
-rw-r--r-- | src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp (renamed from src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp) | 12 | ||||
-rw-r--r-- | src/cpu/kernels/elementwise_unary/list.h | 2 | ||||
-rw-r--r-- | src/cpu/kernels/lut/generic/sve2/u8.cpp (renamed from src/cpu/kernels/lut/generic/sve/u8.cpp) | 3 | ||||
-rw-r--r-- | src/cpu/kernels/lut/list.h | 2 |
8 files changed, 20 insertions, 21 deletions
diff --git a/src/cpu/kernels/CpuActivationKernel.cpp b/src/cpu/kernels/CpuActivationKernel.cpp index 04a9731f4a..20a8489cdd 100644 --- a/src/cpu/kernels/CpuActivationKernel.cpp +++ b/src/cpu/kernels/CpuActivationKernel.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2017-2022 Arm Limited. + * Copyright (c) 2017-2023 Arm Limited. * * SPDX-License-Identifier: MIT * @@ -47,9 +47,9 @@ static const std::vector<CpuActivationKernel::ActivationKernel> available_kernel { #ifdef ARM_COMPUTE_ENABLE_SVE { - "sve_q8_activation_lut", - [](const ActivationDataTypeISASelectorData & data) { return ActivationLayerInfo::is_lut_supported(data.f, data.dt) && data.cpumodel == CPUModel::A510 && data.isa.sve; }, - REGISTER_QASYMM8_SVE(arm_compute::cpu::sve_q8_activation_lut) + "sve2_q8_activation_lut", + [](const ActivationDataTypeISASelectorData & data) { return ActivationLayerInfo::is_lut_supported(data.f, data.dt) && data.cpumodel == CPUModel::A510 && data.isa.sve2; }, + REGISTER_QASYMM8_SVE2(arm_compute::cpu::sve2_q8_activation_lut) }, #endif // ARM_COMPUTE_ENABLE_SVE #ifdef __aarch64__ diff --git a/src/cpu/kernels/CpuElementwiseUnaryKernel.cpp b/src/cpu/kernels/CpuElementwiseUnaryKernel.cpp index dbb752aef3..04a7f15715 100644 --- a/src/cpu/kernels/CpuElementwiseUnaryKernel.cpp +++ b/src/cpu/kernels/CpuElementwiseUnaryKernel.cpp @@ -167,12 +167,12 @@ static const std::vector<CpuElementwiseUnaryKernel::ElementwiseUnaryKernel> avai }, #ifdef __aarch64__ { - "sve_q8_elementwise_unary", + "sve2_q8_elementwise_unary", [](const DataTypeISASelectorData & data) { - return (data.dt == DataType::QASYMM8 || data.dt == DataType::QASYMM8_SIGNED) && data.isa.sve; + return (data.dt == DataType::QASYMM8 || data.dt == DataType::QASYMM8_SIGNED) && data.isa.sve2; }, - REGISTER_QASYMM8_SVE(sve_q8_elementwise_unary), + REGISTER_QASYMM8_SVE2(sve2_q8_elementwise_unary), &q8_prepare_lut, }, { diff --git a/src/cpu/kernels/activation/generic/sve/lut.cpp b/src/cpu/kernels/activation/generic/sve2/lut.cpp index b4042662b9..2e5975744b 100644 --- a/src/cpu/kernels/activation/generic/sve/lut.cpp +++ b/src/cpu/kernels/activation/generic/sve2/lut.cpp @@ -30,7 +30,7 @@ namespace arm_compute namespace cpu { #ifdef __aarch64__ -void sve_q8_activation_lut(const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) +void sve2_q8_activation_lut(const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) { ARM_COMPUTE_ERROR_ON(!ActivationLayerInfo::is_lut_supported(act_info.activation(), src->info()->data_type())); const auto window_end_x = window.x().end(); @@ -42,7 +42,7 @@ void sve_q8_activation_lut(const ITensor *src, ITensor *dst, const ActivationLay { const auto input_ptr = input.ptr(); auto output_ptr = output.ptr(); - lut_u8_sve(act_info.lut().data(), 1u, window_end_x, &input_ptr, &output_ptr); + lut_u8_sve2(act_info.lut().data(), 1u, window_end_x, &input_ptr, &output_ptr); }, input, output); } diff --git a/src/cpu/kernels/activation/list.h b/src/cpu/kernels/activation/list.h index c2149b38ff..6550ddfeca 100644 --- a/src/cpu/kernels/activation/list.h +++ b/src/cpu/kernels/activation/list.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2020-2022 Arm Limited. + * Copyright (c) 2020-2023 Arm Limited. * * SPDX-License-Identifier: MIT * @@ -34,7 +34,7 @@ namespace cpu #ifdef __aarch64__ DECLARE_ACTIVATION_KERNEL(neon_q8_activation_lut); #endif // __aarch64__ -DECLARE_ACTIVATION_KERNEL(sve_q8_activation_lut); +DECLARE_ACTIVATION_KERNEL(sve2_q8_activation_lut); DECLARE_ACTIVATION_KERNEL(neon_qasymm8_activation); DECLARE_ACTIVATION_KERNEL(sve2_qasymm8_activation); DECLARE_ACTIVATION_KERNEL(neon_qasymm8_signed_activation); diff --git a/src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp b/src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp index b68f691086..7e32f50132 100644 --- a/src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp +++ b/src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp @@ -29,23 +29,23 @@ namespace arm_compute { namespace cpu { - -void sve_q8_elementwise_unary(const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) +void sve2_q8_elementwise_unary(const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) { ARM_COMPUTE_UNUSED(op); - auto win = window; + auto win = window; const auto window_end_x = window.x().end(); win.set(0, Window::Dimension(0, 1, 1)); Iterator src_it(in, win); Iterator dst_it(out, win); - execute_window_loop(win, [&](const Coordinates &) { + execute_window_loop(win, [&](const Coordinates &) + { const auto src_ptr = src_it.ptr(); - auto dst_ptr = dst_it.ptr(); + auto dst_ptr = dst_it.ptr(); - lut_u8_sve(lut, 1, window_end_x, &src_ptr, &dst_ptr); + lut_u8_sve2(lut, 1, window_end_x, &src_ptr, &dst_ptr); }, src_it, dst_it); } diff --git a/src/cpu/kernels/elementwise_unary/list.h b/src/cpu/kernels/elementwise_unary/list.h index 432fabf4af..a9701afdd8 100644 --- a/src/cpu/kernels/elementwise_unary/list.h +++ b/src/cpu/kernels/elementwise_unary/list.h @@ -37,7 +37,7 @@ namespace cpu DECLARE_ELEMETWISE_UNARY_KERNEL(sve_fp32_elementwise_unary); DECLARE_ELEMETWISE_UNARY_KERNEL(sve_fp16_elementwise_unary); DECLARE_ELEMETWISE_UNARY_KERNEL(sve_s32_elementwise_unary); -DECLARE_ELEMETWISE_UNARY_KERNEL(sve_q8_elementwise_unary); +DECLARE_ELEMETWISE_UNARY_KERNEL(sve2_q8_elementwise_unary); DECLARE_ELEMETWISE_UNARY_KERNEL(neon_fp32_elementwise_unary); DECLARE_ELEMETWISE_UNARY_KERNEL(neon_fp16_elementwise_unary); DECLARE_ELEMETWISE_UNARY_KERNEL(neon_s32_elementwise_unary); diff --git a/src/cpu/kernels/lut/generic/sve/u8.cpp b/src/cpu/kernels/lut/generic/sve2/u8.cpp index 70f3a2e6fb..b80d75326e 100644 --- a/src/cpu/kernels/lut/generic/sve/u8.cpp +++ b/src/cpu/kernels/lut/generic/sve2/u8.cpp @@ -31,8 +31,7 @@ namespace arm_compute { namespace cpu { - -void lut_u8_sve( +void lut_u8_sve2( const uint8_t *table, size_t num_strings, size_t string_length, diff --git a/src/cpu/kernels/lut/list.h b/src/cpu/kernels/lut/list.h index 9749b91cfe..7a2afc6927 100644 --- a/src/cpu/kernels/lut/list.h +++ b/src/cpu/kernels/lut/list.h @@ -43,7 +43,7 @@ namespace cpu uint8_t *const *output) DECLARE_LUT_KERNEL(lut_u8_neon); -DECLARE_LUT_KERNEL(lut_u8_sve); +DECLARE_LUT_KERNEL(lut_u8_sve2); #undef DECLARE_LUT_KERNEL #endif // __aarch64__ |