// // Copyright © 2017 Arm Ltd. All rights reserved. // SPDX-License-Identifier: MIT // #include #include "BFloat16.hpp" #include "Half.hpp" #include #include namespace armnnUtils { void FloatingPointConverter::ConvertFloat32To16(const float* srcFloat32Buffer, size_t numElements, void* dstFloat16Buffer) { if (srcFloat32Buffer == nullptr) { throw armnn::InvalidArgumentException("ConvertFloat32To16: source float32 buffer pointer is null"); } if (dstFloat16Buffer == nullptr) { throw armnn::InvalidArgumentException("ConvertFloat32To16: destination float16 buffer pointer is null"); } armnn::Half* pHalf = static_cast(dstFloat16Buffer); for (size_t i = 0; i < numElements; i++) { pHalf[i] = armnn::Half(srcFloat32Buffer[i]); if (isinf(pHalf[i])) { // If the value of converted Fp16 is infinity, round to the closest finite Fp16 value. pHalf[i] = copysign(std::numeric_limits::max(), pHalf[i]); } } } void FloatingPointConverter::ConvertFloat16To32(const void* srcFloat16Buffer, size_t numElements, float* dstFloat32Buffer) { if (srcFloat16Buffer == nullptr) { throw armnn::InvalidArgumentException("ConvertFloat16To32: source float16 buffer pointer is null"); } if (dstFloat32Buffer == nullptr) { throw armnn::InvalidArgumentException("ConvertFloat16To32: destination float32 buffer pointer is null"); } const armnn::Half* pHalf = static_cast(srcFloat16Buffer); for (size_t i = 0; i < numElements; i++) { dstFloat32Buffer[i] = pHalf[i]; } } } //namespace armnnUtils