From e7280585b317f695a932be5981895377e174946d Mon Sep 17 00:00:00 2001
From: Sang-Hoon Park
Date: Tue, 13 Oct 2020 23:34:09 +0100
Subject: COMPMID-3805: Fix SQRT non-zero output for zero input

- For AArch64, NEActivationLayerKernel uses vsqrt rather than vinvsqrt.
- For non-AArch64, it masks values to ensure zero input results in zero output without producing NaN.
- Test cases for FP16 and FP32's positive boundary values are added.

Change-Id: Ic0104ee5d7045059c2e9bd052616a4a3b43a315d
Signed-off-by: Sang-Hoon Park
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/4150
Comments-Addressed: Arm Jenkins
Tested-by: Arm Jenkins
Reviewed-by: Georgios Pinitas
---
 src/core/NEON/wrapper/intrinsics/intrinsics.h | 1 +
 1 file changed, 1 insertion(+)

(limited to 'src/core/NEON/wrapper/intrinsics/intrinsics.h')

diff --git a/src/core/NEON/wrapper/intrinsics/intrinsics.h b/src/core/NEON/wrapper/intrinsics/intrinsics.h
index 495321a6a1..070f3c7065 100644
--- a/src/core/NEON/wrapper/intrinsics/intrinsics.h
+++ b/src/core/NEON/wrapper/intrinsics/intrinsics.h
@@ -66,6 +66,7 @@
 #include "src/core/NEON/wrapper/intrinsics/round.h"
 #include "src/core/NEON/wrapper/intrinsics/setlane.h"
 #include "src/core/NEON/wrapper/intrinsics/sin.h"
+#include "src/core/NEON/wrapper/intrinsics/sqrt.h"
 #include "src/core/NEON/wrapper/intrinsics/store.h"
 #include "src/core/NEON/wrapper/intrinsics/sub.h"
 #include "src/core/NEON/wrapper/intrinsics/tanh.h"
-- 
cgit v1.2.1