diff options
author | SiCong Li <sicong.li@arm.com> | 2023-05-17 13:46:13 +0100 |
---|---|---|
committer | SiCong Li <sicong.li@arm.com> | 2023-05-17 15:20:17 +0000 |
commit | c0463a2959c84e8aa28f39ed2faa035678e682d8 (patch) | |
tree | 3aadfd440b51a919c07517b14a0ae74c83c13033 /src/cpu/kernels/elementwise_unary/generic | |
parent | f15c615e79eb13c7457288e79b8a906bc68dfa1a (diff) | |
download | ComputeLibrary-c0463a2959c84e8aa28f39ed2faa035678e682d8.tar.gz |
Move LUT kernel to SVE2 category
This specific LUT kernel uses SVE2 instructions
Resolves: COMPMID-6268
Signed-off-by: SiCong Li <sicong.li@arm.com>
Change-Id: I44fa3812e96fa79b3d1e1e3a31d587581f59f0e1
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/9675
Reviewed-by: Viet-Hoa Do <viet-hoa.do@arm.com>
Reviewed-by: Jakub Sujak <jakub.sujak@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/cpu/kernels/elementwise_unary/generic')
-rw-r--r-- | src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp (renamed from src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp) | 12 |
1 file changed, 6 insertions, 6 deletions
diff --git a/src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp b/src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp
index b68f691086..7e32f50132 100644
--- a/src/cpu/kernels/elementwise_unary/generic/sve/q8.cpp
+++ b/src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp
@@ -29,23 +29,23 @@ namespace arm_compute
 {
 namespace cpu
 {
-
-void sve_q8_elementwise_unary(const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut)
+void sve2_q8_elementwise_unary(const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut)
 {
     ARM_COMPUTE_UNUSED(op);
 
-    auto win = window;
+    auto       win          = window;
     const auto window_end_x = window.x().end();
     win.set(0, Window::Dimension(0, 1, 1));
 
     Iterator src_it(in, win);
     Iterator dst_it(out, win);
 
-    execute_window_loop(win, [&](const Coordinates &) {
+    execute_window_loop(win, [&](const Coordinates &)
+    {
         const auto src_ptr = src_it.ptr();
-        auto dst_ptr = dst_it.ptr();
+        auto       dst_ptr = dst_it.ptr();
 
-        lut_u8_sve(lut, 1, window_end_x, &src_ptr, &dst_ptr);
+        lut_u8_sve2(lut, 1, window_end_x, &src_ptr, &dst_ptr);
     },
     src_it, dst_it);
 }