src/backends/reference/workloads/RefElementwiseWorkload.cpp
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "RefElementwiseWorkload.hpp"
#include "ElementwiseFunction.hpp"
#include "RefWorkloadUtils.hpp"
#include "Profiling.hpp"
#include "StringMapping.hpp"
#include "TypeUtils.hpp"
#include <vector>

namespace armnn
{

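// Performs the element-wise binary operation described by Functor on the two
// input tensors, writing the result to the single output tensor. The supported
// data types are handled in the switch below.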
template <typename Functor,
          typename armnn::DataType DataType,
          typename ParentDescriptor,
          typename armnn::StringMapping::Id DebugString>
void RefElementwiseWorkload<Functor, DataType, ParentDescriptor, DebugString>::Execute() const
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::CpuRef, StringMapping::Instance().Get(DebugString));

    const TensorInfo& inputInfo0 = GetTensorInfo(m_Data.m_Inputs[0]);
    const TensorInfo& inputInfo1 = GetTensorInfo(m_Data.m_Inputs[1]);
    const TensorInfo& outputInfo = GetTensorInfo(m_Data.m_Outputs[0]);

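    // Both input shapes are passed through to ElementwiseFunction alongside
    // the output shape, so it can broadcast the inputs against each other
    // where their dimensions differ.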
    const TensorShape& inShape0 = inputInfo0.GetShape();
    const TensorShape& inShape1 = inputInfo1.GetShape();
    const TensorShape& outShape = outputInfo.GetShape();

    switch(DataType)
    {
        case armnn::DataType::QuantisedAsymm8:
        {
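            // Quantized inputs are dequantized to float, the operation is
            // applied in the float domain, and the result is requantized to
            // the output tensor's scale and offset.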
            std::vector<float> results(outputInfo.GetNumElements());
            ElementwiseFunction<Functor, float, float>(inShape0,
                                                       inShape1,
                                                       outShape,
                                                       Dequantize(GetInputTensorDataU8(0, m_Data), inputInfo0).data(),
                                                       Dequantize(GetInputTensorDataU8(1, m_Data), inputInfo1).data(),
                                                       results.data());
            Quantize(GetOutputTensorDataU8(0, m_Data), results.data(), outputInfo);
            break;
        }
        case armnn::DataType::Float32:
        {
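            // Float32 tensors can be passed to the element-wise function
            // directly; no conversion is required.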
            ElementwiseFunction<Functor, float, float>(inShape0,
                                                       inShape1,
                                                       outShape,
                                                       GetInputTensorDataFloat(0, m_Data),
                                                       GetInputTensorDataFloat(1, m_Data),
                                                       GetOutputTensorDataFloat(0, m_Data));
            break;
        }
        default:
            BOOST_ASSERT_MSG(false, "Unknown Data Type!");
            break;
    }
}

} // namespace armnn

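// Explicit instantiations for every supported combination of arithmetic
// functor and data type, so that the template definition above can stay in
// this translation unit.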
template class armnn::RefElementwiseWorkload<std::plus<float>,
    armnn::DataType::Float32,
    armnn::AdditionQueueDescriptor,
    armnn::StringMapping::RefAdditionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::plus<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::AdditionQueueDescriptor,
    armnn::StringMapping::RefAdditionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::minus<float>,
    armnn::DataType::Float32,
    armnn::SubtractionQueueDescriptor,
    armnn::StringMapping::RefSubtractionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::minus<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::SubtractionQueueDescriptor,
    armnn::StringMapping::RefSubtractionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::multiplies<float>,
    armnn::DataType::Float32,
    armnn::MultiplicationQueueDescriptor,
    armnn::StringMapping::RefMultiplicationWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::multiplies<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::MultiplicationQueueDescriptor,
    armnn::StringMapping::RefMultiplicationWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::divides<float>,
    armnn::DataType::Float32,
    armnn::DivisionQueueDescriptor,
    armnn::StringMapping::RefDivisionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<std::divides<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::DivisionQueueDescriptor,
    armnn::StringMapping::RefDivisionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<armnn::maximum<float>,
    armnn::DataType::Float32,
    armnn::MaximumQueueDescriptor,
    armnn::StringMapping::RefMaximumWorkload_Execute>;

template class armnn::RefElementwiseWorkload<armnn::maximum<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::MaximumQueueDescriptor,
    armnn::StringMapping::RefMaximumWorkload_Execute>;

template class armnn::RefElementwiseWorkload<armnn::minimum<float>,
    armnn::DataType::Float32,
    armnn::MinimumQueueDescriptor,
    armnn::StringMapping::RefMinimumWorkload_Execute>;

template class armnn::RefElementwiseWorkload<armnn::minimum<float>,
    armnn::DataType::QuantisedAsymm8,
    armnn::MinimumQueueDescriptor,
    armnn::StringMapping::RefMinimumWorkload_Execute>;
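
// For reference, a minimal sketch of how one of the instantiations above
// could be given a concrete workload name via an alias. Any real aliases
// would live in RefElementwiseWorkload.hpp; the alias name below is an
// assumption for illustration only:
//
//     using RefAdditionFloat32Workload =
//         armnn::RefElementwiseWorkload<std::plus<float>,
//                                       armnn::DataType::Float32,
//                                       armnn::AdditionQueueDescriptor,
//                                       armnn::StringMapping::RefAdditionWorkload_Execute>;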