From 3f16c5758f4f8e71e76e302150f0696a1dcc59fa Mon Sep 17 00:00:00 2001 From: Pablo Marquez Tello Date: Tue, 20 Jun 2023 13:39:10 +0100 Subject: Enable vfma in armv7a/aarch32 when present * vfma is an extension on armv7a and it can be enabled with -mfpu=neon-vfpv4 * Resolves MLCE-1079 Change-Id: Id455c39ee4feb8d3cdc4515c8307eb8a5d6e093b Signed-off-by: Pablo Marquez Tello Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/9795 Benchmark: Arm Jenkins Tested-by: Arm Jenkins Reviewed-by: Jakub Sujak Comments-Addressed: Arm Jenkins --- src/core/NEON/NEMath.inl | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) (limited to 'src/core') diff --git a/src/core/NEON/NEMath.inl b/src/core/NEON/NEMath.inl index 6198a257fc..1cbe669373 100644 --- a/src/core/NEON/NEMath.inl +++ b/src/core/NEON/NEMath.inl @@ -52,11 +52,11 @@ constexpr float te_sin_coeff5 = 0.013888888889f; // 1/(8*9) #ifndef DOXYGEN_SKIP_THIS inline float32x4_t prefer_vfmaq_f32(float32x4_t a, float32x4_t b, float32x4_t c) { -#ifdef __aarch64__ +#if __ARM_FEATURE_FMA return vfmaq_f32(a, b, c); -#else // __aarch64__ +#else // __ARM_FEATURE_FMA return vmlaq_f32(a, b, c); -#endif // __aarch64__ +#endif // __ARM_FEATURE_FMA } inline float32x4_t vfloorq_f32(float32x4_t val) -- cgit v1.2.1