diff options
Diffstat (limited to 'src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp')
-rw-r--r-- | src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp | 17 |
1 files changed, 14 insertions, 3 deletions
diff --git a/src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp b/src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp index c68960fad2..be13458d89 100644 --- a/src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp +++ b/src/backends/reference/workloads/RefConvertFp32ToFp16Workload.cpp @@ -16,13 +16,24 @@ namespace armnn void RefConvertFp32ToFp16Workload::Execute() const { + Execute(m_Data.m_Inputs, m_Data.m_Outputs); +} + +void RefConvertFp32ToFp16Workload::ExecuteAsync(WorkingMemDescriptor &workingMemDescriptor) +{ + Execute(workingMemDescriptor.m_Inputs, workingMemDescriptor.m_Outputs); +} + +void RefConvertFp32ToFp16Workload::Execute(std::vector<ITensorHandle*> inputs, + std::vector<ITensorHandle*> outputs) const +{ ARMNN_SCOPED_PROFILING_EVENT(Compute::CpuRef, "RefConvertFp32ToFp16Workload_Execute"); - const float* const input = GetInputTensorDataFloat(0, m_Data); - Half* const output = GetOutputTensorDataHalf(0, m_Data); + const float* const input = reinterpret_cast<const float*>(inputs[0]->Map()); + Half* const output = reinterpret_cast<Half*>(outputs[0]->Map()); // convert Fp32 input to Fp16 output - unsigned int numElements = GetTensorInfo(m_Data.m_Inputs[0]).GetNumElements(); + unsigned int numElements = GetTensorInfo(inputs[0]).GetNumElements(); armnnUtils::FloatingPointConverter::ConvertFloat32To16(input, numElements, output); } |