1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
|
//
// Copyright © 2020 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "ConvertFp32ToBf16TestImpl.hpp"
#include <backendsCommon/test/TensorCopyUtils.hpp>
#include <backendsCommon/test/WorkloadTestUtils.hpp>
#include <test/TensorHelpers.hpp>
// Runs a ConvertFp32ToBf16 workload over a fixed {1, 2, 4, 3} Float32 tensor and
// returns the produced BFloat16 output together with the expected BFloat16 values.
//
// workloadFactory     - factory used to create the conversion workload under test.
// memoryManager       - not used by this test (explicitly ignored).
// tensorHandleFactory - factory used to create the input and output tensor handles.
//
// The returned LayerTestResult has `outputExpected` filled from the reference table
// below and `output` filled with the data copied back from the output handle.
LayerTestResult<armnn::BFloat16, 4> ConvertFp32ToBf16Test(
    armnn::IWorkloadFactory& workloadFactory,
    const armnn::IBackendInternal::IMemoryManagerSharedPtr& memoryManager,
    const armnn::ITensorHandleFactory& tensorHandleFactory)
{
    IgnoreUnused(memoryManager);

    // Source and destination share the same shape; only the data type differs.
    const armnn::TensorInfo inputTensorInfo({1, 2, 4, 3}, armnn::DataType::Float32);
    const armnn::TensorInfo outputTensorInfo({1, 2, 4, 3}, armnn::DataType::BFloat16);

    // Reference BFloat16 values, element-for-element with the Float32 input below.
    // The last six entries are the rounded counterparts of the rounding probes
    // (the trailing comment gives the 16-bit pattern).
    std::vector<armnn::BFloat16> expectedValues = armnnUtils::QuantizedVector<armnn::BFloat16>(
        {
            -37.5f, -15.2f, -8.76f,
            -2.0f, -1.5f, -1.3f,
            -0.5f, -0.4f, 0.0f,
            1.0f, 0.4f, 0.5f,
            1.3f, 1.5f, 2.0f,
            8.76f, 15.2f, 37.5f,
            3.796875f,      // 0x4073
            3.1072295E29f,  // 0x707B
            9.131327E-10f,  // 0x307B
            -3.796875f,     // 0xC073
            -3.1072295E29f, // 0xF07B
            -9.131327E-10f  // 0xB07B
        },
        1.0f, 0);

    // Float32 input: ordinary values followed by six rounding probes
    // (the trailing comment gives the 32-bit pattern and the rounding direction).
    auto inputTensor = MakeTensor<float, 4>(inputTensorInfo,
        {
            -37.5f, -15.2f, -8.76f,
            -2.0f, -1.5f, -1.3f,
            -0.5f, -0.4f, 0.0f,
            1.0f, 0.4f, 0.5f,
            1.3f, 1.5f, 2.0f,
            8.76f, 15.2f, 37.5f,
            3.8f,           // 0x40733333 Round down
            3.1055E+29f,    // 0x707ADC3C Round up
            9.149516E-10f,  // 0x307B7FFF Round down
            -3.8f,          // 0xC0733333 Round down
            -3.1055E+29f,   // 0xF07ADC3C Round up
            -9.149516E-10f  // 0xB07B7FFF Round down
        });

    LayerTestResult<armnn::BFloat16, 4> result(outputTensorInfo);
    result.outputExpected = MakeTensor<armnn::BFloat16, 4>(outputTensorInfo, expectedValues);

    // Tensor handles for the workload's single input and single output.
    std::unique_ptr<armnn::ITensorHandle> srcHandle =
        tensorHandleFactory.CreateTensorHandle(inputTensorInfo);
    std::unique_ptr<armnn::ITensorHandle> dstHandle =
        tensorHandleFactory.CreateTensorHandle(outputTensorInfo);

    // Register both handles on the queue descriptor, then create the workload from it.
    armnn::ConvertFp32ToBf16QueueDescriptor descriptor;
    armnn::WorkloadInfo workloadInfo;
    AddInputToWorkload(descriptor, workloadInfo, inputTensorInfo, srcHandle.get());
    AddOutputToWorkload(descriptor, workloadInfo, outputTensorInfo, dstHandle.get());

    std::unique_ptr<armnn::IWorkload> conversion =
        workloadFactory.CreateConvertFp32ToBf16(descriptor, workloadInfo);

    srcHandle->Allocate();
    dstHandle->Allocate();

    // Upload the input, run the conversion, then read the result back.
    CopyDataToITensorHandle(srcHandle.get(), &inputTensor[0][0][0][0]);
    conversion->Execute();
    CopyDataFromITensorHandle(&result.output[0][0][0][0], dstHandle.get());

    return result;
}
|