about | summary | refs | log | tree | commit | diff
path: root/src/core/NEON/kernels/NEReductionOperationKernel.cpp
diff options
context:
space:
mode:
author Usama Arif <usama.arif@arm.com> 2019-05-23 14:20:33 +0100
committer Usama Arif <usama.arif@arm.com> 2019-05-24 16:11:16 +0000
commit 0a5a57a3f794de851408bae1c63b1660b4c5cbe7 (patch)
tree 5d49d85165a3d9fd257c5676691fc5ae24fda4f3 /src/core/NEON/kernels/NEReductionOperationKernel.cpp
parent 43c1bf8e47098d6ab07be5b5e685bda6d8b80344 (diff)
download ComputeLibrary-0a5a57a3f794de851408bae1c63b1660b4c5cbe7.tar.gz
COMPMID-2160: Implement Round for NEON
Change-Id: Ie80e2ad294eaf95bc823d979842c320e8fb41f67
Signed-off-by: Usama Arif <usama.arif@arm.com>
Reviewed-on: https://review.mlplatform.org/c/1215
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core/NEON/kernels/NEReductionOperationKernel.cpp')
-rw-r--r-- src/core/NEON/kernels/NEReductionOperationKernel.cpp 2
1 files changed, 2 insertions, 0 deletions
diff --git a/src/core/NEON/kernels/NEReductionOperationKernel.cpp b/src/core/NEON/kernels/NEReductionOperationKernel.cpp
index e6edf22083..c6e853659c 100644
--- a/src/core/NEON/kernels/NEReductionOperationKernel.cpp
+++ b/src/core/NEON/kernels/NEReductionOperationKernel.cpp
@@ -180,6 +180,7 @@ inline uint8x8_t calculate_max(uint8x16_t in)
return wrapper::vpmax(pmax, pmax);
}
+template <>
uint32_t calculate_vector_index(uint32x4x4_t vec_res_idx, uint8x16_t vec_res_value, ReductionOperation op)
{
uint32x4x4_t res_idx_mask{ { 0 } };
@@ -272,6 +273,7 @@ inline float16x4_t calculate_max(float16x8_t in)
return wrapper::vpmax(pmax, pmax);
}
+template <>
uint32_t calculate_vector_index(uint32x4x4_t vec_res_idx, float16x8_t vec_res_value, ReductionOperation op)
{
uint32x4x2_t res_idx_mask{ 0 };