diff options
author | Pablo Marquez Tello <pablo.tello@arm.com> | 2022-07-19 12:19:46 +0100 |
---|---|---|
committer | Pablo Marquez Tello <pablo.tello@arm.com> | 2022-07-25 15:56:00 +0000 |
commit | d208f4f1c2da9e407f86022959c32e8ab9a4aa6e (patch) | |
tree | f1dc538edb68fa6e266ad8890582f179b961bfae /src/core | |
parent | 962531886eee29527bf027107124a27ce94047eb (diff) | |
download | ComputeLibrary-d208f4f1c2da9e407f86022959c32e8ab9a4aa6e.tar.gz |
Enable -march=armv8.6-a in non-multi-ISA builds
* scons arch=armv8.6-a translates to -march=armv8.6-a
* scons arch=armv8.6-a-sve translates to -march=armv8.6-a+sve
* scons arch=armv8.6-a-sve2 translates to -march=armv8.6-a+sve2
* Resolves COMPMID-5408
Change-Id: I0901e1de864d00109759509af7cc2b5c9ae1cd75
Signed-off-by: Pablo Marquez Tello <pablo.tello@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/7943
Reviewed-by: Gunes Bayir <gunes.bayir@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/core')
-rw-r--r-- | src/core/NEON/wrapper/intrinsics/cvt.h | 6 | ||||
-rw-r--r-- | src/core/common/Registrars.h | 6 |
2 files changed, 6 insertions, 6 deletions
```diff
diff --git a/src/core/NEON/wrapper/intrinsics/cvt.h b/src/core/NEON/wrapper/intrinsics/cvt.h
index 6e79a92bc2..e52e3dd0c4 100644
--- a/src/core/NEON/wrapper/intrinsics/cvt.h
+++ b/src/core/NEON/wrapper/intrinsics/cvt.h
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020 Arm Limited.
+ * Copyright (c) 2020, 2022 Arm Limited.
  *
  * SPDX-License-Identifier: MIT
  *
@@ -72,7 +72,7 @@ vcvt(const float32x4_t &a)
     return vcvtq_s32_f32(a);
 }
 
-#if defined(__ARM_FEATURE_BF16_VECTOR_ARITHMETIC) || defined(ARM_COMPUTE_FORCE_BF16)
+#if defined(ARM_COMPUTE_ENABLE_BF16)
 /** Convert 2x128-bit floating point vectors into 1x128-bit bfloat16 vector
  *
  * @param[in] inptr Pointer to the input memory to load values from
@@ -89,7 +89,7 @@ inline void vcvt_bf16_f32(const float *inptr, uint16_t *outptr)
         : [outptr] "r"(outptr)
         : "v0", "v1", "memory");
 }
-#endif /* defined(__ARM_FEATURE_BF16_VECTOR_ARITHMETIC) || defined(ARM_COMPUTE_FORCE_BF16) */
+#endif /* defined(ARM_COMPUTE_ENABLE_BF16) */
 
 } // namespace wrapper
 } // namespace arm_compute
diff --git a/src/core/common/Registrars.h b/src/core/common/Registrars.h
index cc76de2be5..42c1aaa9fa 100644
--- a/src/core/common/Registrars.h
+++ b/src/core/common/Registrars.h
@@ -167,10 +167,10 @@
 #define REGISTER_INTEGER_SVE2(func_name) nullptr
 #endif /* defined(ENABLE_INTEGER_KERNELS) */
 
-#if defined(__ARM_FEATURE_BF16_VECTOR_ARITHMETIC) || defined(ARM_COMPUTE_FORCE_BF16)
+#if defined(ARM_COMPUTE_ENABLE_BF16)
 #define REGISTER_BF16_NEON(func_name) &(func_name)
-#else /* !(defined(__ARM_FEATURE_BF16_VECTOR_ARITHMETIC) || defined(ARM_COMPUTE_FORCE_BF16))*/
+#else /* !(defined(ARM_COMPUTE_ENABLE_BF16))*/
 #define REGISTER_BF16_NEON(func_name) nullptr
-#endif /* defined(__ARM_FEATURE_BF16_VECTOR_ARITHMETIC) || defined(ARM_COMPUTE_FORCE_BF16)*/
+#endif /* defined(ARM_COMPUTE_ENABLE_BF16)*/
 
 #endif /* SRC_CORE_COMMON_REGISTRARS_H */
```