diff options
author | Ramy Elgammal <ramy.elgammal@arm.com> | 2023-03-31 16:16:15 +0100 |
---|---|---|
committer | Ramy Elgammal <ramy.elgammal@arm.com> | 2023-04-11 09:27:02 +0000 |
commit | 8b7f42aa0e76a65a4ffa46ee875df6a6220695ae (patch) | |
tree | 3bc006b26a659e5b404dbda48ecb259626d26fef /tests/validation/NEON/ElementwiseAbsoluteValue.cpp | |
parent | dcab9ca1b7914eb8cadadfaa5fb468e469dca5d9 (diff) | |
download | ComputeLibrary-8b7f42aa0e76a65a4ffa46ee875df6a6220695ae.tar.gz |
Enable quantized data types for CpuElementwiseUnary on Armv7a
- Adding fallback functions neon_qasymm8_signed_elementwise_unary() and
neon_qasymm8_elementwise_unary()
- They would be called in case target is not aarch64
Resolves: COMPMID-5994
Change-Id: Id0db1e7cb0fe92f1eaef0b3a9ed2bea01b3f2a15
Signed-off-by: Ramy Elgammal <ramy.elgammal@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/9416
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Viet-Hoa Do <viet-hoa.do@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'tests/validation/NEON/ElementwiseAbsoluteValue.cpp')
-rw-r--r-- | tests/validation/NEON/ElementwiseAbsoluteValue.cpp | 7 |
1 files changed, 6 insertions, 1 deletions
diff --git a/tests/validation/NEON/ElementwiseAbsoluteValue.cpp b/tests/validation/NEON/ElementwiseAbsoluteValue.cpp index 7f6a6a5bb2..0667ac73f9 100644 --- a/tests/validation/NEON/ElementwiseAbsoluteValue.cpp +++ b/tests/validation/NEON/ElementwiseAbsoluteValue.cpp @@ -46,8 +46,13 @@ RelativeTolerance<float> tolerance_fp32(0.000001f); #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC RelativeTolerance<float> tolerance_fp16(0.01f); #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC +#if defined(__aarch64__) constexpr AbsoluteTolerance<uint8_t> tolerance_qasymm8(0); constexpr AbsoluteTolerance<int8_t> tolerance_qasymm8_signed(0); +#else // #if !defined(__aarch64__) +constexpr AbsoluteTolerance<uint8_t> tolerance_qasymm8(1); // There is difference of 1, because quantizing in reference uses round policy "TO_NEAREST_UP", where the armv7a neon kernel uses "TO_ZERO" +constexpr AbsoluteTolerance<int8_t> tolerance_qasymm8_signed(1); +#endif // #if !defined(__aarch64__) } // namespace TEST_SUITE(NEON) @@ -136,8 +141,8 @@ FIXTURE_DATA_TEST_CASE(RunSmall, NEAbsLayerQuantizedFixture<int8_t>, framework:: validate(Accessor(_target), _reference, tolerance_qasymm8_signed); } TEST_SUITE_END() // QASYMM8_SIGNED - TEST_SUITE_END() // Quantized + TEST_SUITE_END() // AbsLayer TEST_SUITE_END() // Neon } // namespace validation |