/*
 * Copyright (c) 2017-2019 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#include "PixelWiseMultiplication.h"

#include "tests/validation/Helpers.h"

#include <cstddef>
#include <cstdint>
#include <type_traits>

namespace arm_compute
{
namespace test
{
namespace validation
{
namespace reference
{
/** Trait that is true when @p T, ignoring cv-qualifiers, is a floating point type.
 *
 * Used by mul() to decide whether the scaled product needs rounding and
 * overflow handling before it is converted to the output type.
 *
 * NOTE(review): the template argument lists were missing from the reviewed text;
 * the set of types below (float, half, double, long double) was restored and
 * should be confirmed against the project history.
 */
template <class T>
struct is_floating_point
    : std::integral_constant < bool,
      std::is_same<float, typename std::remove_cv<T>::type>::value || std::is_same<half_float::half, typename std::remove_cv<T>::type>::value
      || std::is_same<double, typename std::remove_cv<T>::type>::value || std::is_same<long double, typename std::remove_cv<T>::type>::value >
{
};

namespace
{
/** Compute the result of `src1 * src2 * scale`. The result type always matches the type of @p src2.
 *
 * The product is evaluated in double precision. For floating point outputs it is
 * converted directly; for every other output type it is first rounded according
 * to @p rounding_policy and then converted according to @p convert_policy.
 *
 * @param[in] src1            An input value. Data types supported: U8/S16/F16/F32.
 * @param[in] src2            An input value. Data types supported: same as @p src1.
 * @param[in] scale           Scale to apply after multiplication.
 *                            Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
 * @param[in] convert_policy  Overflow policy. Supported overflow policies: Wrap, Saturate
 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest up, to nearest even.
 *
 * @return The scaled product converted to the type of @p src2.
 */
template <typename T1, typename T2>
T2 mul(const T1 src1, const T2 src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy)
{
    // NOTE(review): the argument list of common_promoted_signed_type was missing from the
    // reviewed text and has been restored as <T1, T2, T2> - confirm.
    using intermediate_type = typename common_promoted_signed_type<T1, T2, T2>::intermediate_type;

    // Both operands are widened to the common intermediate type before multiplying
    const double val = static_cast<intermediate_type>(src1) * static_cast<intermediate_type>(src2) * static_cast<double>(scale);

    if(is_floating_point<T2>::value)
    {
        // Floating point outputs need neither rounding nor overflow handling
        const auto result = static_cast<T2>(val);

        return result;
    }
    else
    {
        double rounded_val = 0;
        switch(rounding_policy)
        {
            case(RoundingPolicy::TO_ZERO):
                rounded_val = support::cpp11::trunc(val);
                break;
            case(RoundingPolicy::TO_NEAREST_UP):
                rounded_val = round_half_up(val);
                break;
            case(RoundingPolicy::TO_NEAREST_EVEN):
                rounded_val = round_half_even(val);
                break;
            default:
                ARM_COMPUTE_ERROR("Unsupported rounding policy");
        }

        // NOTE(review): when the policy is not SATURATE the rounded value is converted with a
        // plain static_cast. For integer outputs, converting a double that lies outside the
        // range of T2 is undefined behaviour in C++ rather than a guaranteed wrap-around -
        // confirm this is acceptable for the reference.
        const auto result = static_cast<T2>((convert_policy == ConvertPolicy::SATURATE) ? saturate_cast<T2>(rounded_val) : rounded_val);

        return result;
    }
}

/** Recursive helper that walks every element of the destination tensor.
 *
 * Each instantiation iterates over dimension `dim - 1` of the destination and
 * delegates the remaining lower dimensions to `BroadcastUnroll<dim - 1>`.
 * A source whose extent in the current dimension differs from the destination's
 * is treated as broadcast: its coordinate in that dimension stays at 0.
 */
template <size_t dim>
struct BroadcastUnroll
{
    /** Process dimension `dim - 1` and recurse into the lower dimensions.
     *
     * @param[in]      src1            First input tensor.
     * @param[in]      src2            Second input tensor.
     * @param[out]     dst             Output tensor.
     * @param[in]      scale           Scale forwarded to mul().
     * @param[in]      convert_policy  Overflow policy forwarded to mul().
     * @param[in]      rounding_policy Rounding policy forwarded to mul().
     * @param[in, out] id_src1         Current coordinates in @p src1.
     * @param[in, out] id_src2         Current coordinates in @p src2.
     * @param[in, out] id_dst          Current coordinates in @p dst.
     */
    template <typename T1, typename T2>
    static void unroll(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, SimpleTensor<T2> &dst,
                       float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy,
                       Coordinates &id_src1, Coordinates &id_src2, Coordinates &id_dst)
    {
        const bool src1_is_broadcast = (src1.shape()[dim - 1] != dst.shape()[dim - 1]);
        const bool src2_is_broadcast = (src2.shape()[dim - 1] != dst.shape()[dim - 1]);

        // Restart this dimension for all three tensors
        id_src1.set(dim - 1, 0);
        id_src2.set(dim - 1, 0);
        id_dst.set(dim - 1, 0);

        for(size_t i = 0; i < dst.shape()[dim - 1]; ++i, ++id_dst[dim - 1])
        {
            BroadcastUnroll < dim - 1 >::unroll(src1, src2, dst, scale, convert_policy, rounding_policy, id_src1, id_src2, id_dst);

            // A broadcast source keeps coordinate 0, otherwise it advances with the destination
            id_src1[dim - 1] += !src1_is_broadcast;
            id_src2[dim - 1] += !src2_is_broadcast;
        }
    }
};

/** Base case of the recursion: compute a single output element. */
template <>
struct BroadcastUnroll<0>
{
    /** Multiply the elements addressed by @p id_src1 and @p id_src2 and store the result at @p id_dst.
     *
     * @param[in]  src1            First input tensor.
     * @param[in]  src2            Second input tensor.
     * @param[out] dst             Output tensor.
     * @param[in]  scale           Scale forwarded to mul().
     * @param[in]  convert_policy  Overflow policy forwarded to mul().
     * @param[in]  rounding_policy Rounding policy forwarded to mul().
     * @param[in]  id_src1         Coordinates of the element to read from @p src1.
     * @param[in]  id_src2         Coordinates of the element to read from @p src2.
     * @param[in]  id_dst          Coordinates of the element to write in @p dst.
     */
    template <typename T1, typename T2>
    static void unroll(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, SimpleTensor<T2> &dst,
                       float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy,
                       Coordinates &id_src1, Coordinates &id_src2, Coordinates &id_dst)
    {
        dst[coord2index(dst.shape(), id_dst)] = mul(src1[coord2index(src1.shape(), id_src1)], src2[coord2index(src2.shape(), id_src2)], scale, convert_policy, rounding_policy);
    }
};
} // namespace

/** Reference pixel-wise multiplication of two tensors with broadcasting.
 *
 * The output shape is the broadcast of the two input shapes and the output data
 * type is the data type of @p src2.
 *
 * @param[in] src1            First input tensor.
 * @param[in] src2            Second input tensor.
 * @param[in] scale           Scale applied to every product. A negative value raises an error through ARM_COMPUTE_ERROR.
 * @param[in] convert_policy  Overflow policy forwarded to the per-element multiplication.
 * @param[in] rounding_policy Rounding policy forwarded to the per-element multiplication.
 * @param[in] qout            Output quantization information. Unused by this overload.
 *
 * @return The output tensor.
 */
template <typename T1, typename T2>
SimpleTensor<T2> pixel_wise_multiplication(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, QuantizationInfo qout)
{
    ARM_COMPUTE_UNUSED(qout);

    SimpleTensor<T2> dst(TensorShape::broadcast_shape(src1.shape(), src2.shape()), src2.data_type());

    if(scale < 0)
    {
        ARM_COMPUTE_ERROR("Scale of pixel-wise multiplication must be non-negative");
    }

    Coordinates id_src1{};
    Coordinates id_src2{};
    Coordinates id_dst{};

    BroadcastUnroll<Coordinates::num_max_dimensions>::unroll(src1, src2, dst, scale, convert_policy, rounding_policy, id_src1, id_src2, id_dst);

    return dst;
}

/** Specialization for 8-bit unsigned inputs.
 *
 * When both inputs have data type QASYMM8 they are converted with
 * convert_from_asymmetric(), multiplied through the float overload and the
 * result is converted back with convert_to_asymmetric() using @p qout.
 * Otherwise the inputs are multiplied element by element like in the generic
 * overload.
 *
 * @param[in] src1            First input tensor.
 * @param[in] src2            Second input tensor.
 * @param[in] scale           Scale applied to every product. A negative value raises an error through ARM_COMPUTE_ERROR.
 * @param[in] convert_policy  Overflow policy forwarded to the per-element multiplication.
 * @param[in] rounding_policy Rounding policy forwarded to the per-element multiplication.
 * @param[in] qout            Output quantization information, attached to the output tensor.
 *
 * @return The output tensor.
 */
template <>
SimpleTensor<uint8_t> pixel_wise_multiplication(const SimpleTensor<uint8_t> &src1, const SimpleTensor<uint8_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy,
                                                QuantizationInfo qout)
{
    SimpleTensor<uint8_t> dst(TensorShape::broadcast_shape(src1.shape(), src2.shape()), src2.data_type(), 1, qout);

    if(src1.data_type() == DataType::QASYMM8 && src2.data_type() == DataType::QASYMM8)
    {
        // The scale check is performed by the float overload called below
        SimpleTensor<float> src1_tmp = convert_from_asymmetric(src1);
        SimpleTensor<float> src2_tmp = convert_from_asymmetric(src2);
        SimpleTensor<float> dst_tmp  = pixel_wise_multiplication<float>(src1_tmp, src2_tmp, scale, convert_policy, rounding_policy, qout);
        dst                          = convert_to_asymmetric(dst_tmp, qout);
    }
    else
    {
        if(scale < 0)
        {
            ARM_COMPUTE_ERROR("Scale of pixel-wise multiplication must be non-negative");
        }

        Coordinates id_src1{};
        Coordinates id_src2{};
        Coordinates id_dst{};

        BroadcastUnroll<Coordinates::num_max_dimensions>::unroll(src1, src2, dst, scale, convert_policy, rounding_policy, id_src1, id_src2, id_dst);
    }

    return dst;
}

// NOTE(review): the element types of the four explicit instantiations below were missing
// from the reviewed text and have been restored - confirm against the declarations in
// PixelWiseMultiplication.h and the callers.
// *INDENT-OFF*
// clang-format off
template SimpleTensor<int16_t> pixel_wise_multiplication(const SimpleTensor<uint8_t> &src1, const SimpleTensor<int16_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, QuantizationInfo qout);
template SimpleTensor<int16_t> pixel_wise_multiplication(const SimpleTensor<int16_t> &src1, const SimpleTensor<int16_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, QuantizationInfo qout);
template SimpleTensor<float> pixel_wise_multiplication(const SimpleTensor<float> &src1, const SimpleTensor<float> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, QuantizationInfo qout);
template SimpleTensor<half_float::half> pixel_wise_multiplication(const SimpleTensor<half_float::half> &src1, const SimpleTensor<half_float::half> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, QuantizationInfo qout);
// clang-format on
// *INDENT-ON*
} // namespace reference
} // namespace validation
} // namespace test
} // namespace arm_compute