ArmNN
 22.02
ClConvertFp32ToFp16Workload.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
7 #include <cl/ClTensorHandle.hpp>
8 
9 #include "ClWorkloadUtils.hpp"
10 
11 namespace armnn
12 {
13 using namespace armcomputetensorutils;
14 
// Conversion policy shared by this file: it is passed both to m_Layer.configure() in the
// constructor and to CLDepthConvertLayer::validate() in the validation function.
15 static constexpr arm_compute::ConvertPolicy g_AclConvertPolicy = arm_compute::ConvertPolicy::SATURATE;
16 
18  const ConvertFp32ToFp16QueueDescriptor& descriptor,
19  const WorkloadInfo& info,
20  const arm_compute::CLCompileContext& clCompileContext) :
22 {
 // Constructor body: checks that the descriptor carries exactly one input and one output,
 // wraps the slot-0 CL tensors in proxies, and configures m_Layer against those proxies.
23  this->m_Data.ValidateInputsOutputs("ClConvertFp32ToFp16Workload", 1, 1);
24 
25  arm_compute::ICLTensor& input = static_cast<IClTensorHandle*>(this->m_Data.m_Inputs[0])->GetTensor();
26  arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(this->m_Data.m_Outputs[0])->GetTensor();
27 
28  // Create Proxy tensor and set the initial tensor handle to it
 // Reconfigure() later calls set() on these same proxies to point them at replacement tensors.
29  m_InputProxy = std::make_unique<ICLTensorProxy>(&input);
30  m_OutputProxy = std::make_unique<ICLTensorProxy>(&output);
31 
32  {
 // The inner scope limits the profiling event to the configure() call only.
33  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClConvertFp32ToFp16Workload_configure");
 // The proxies (not the raw tensors) are what the layer is configured with.
 // NOTE(review): the trailing 0 is presumably the layer's shift argument - confirm against ACL.
34  m_Layer.configure(clCompileContext, m_InputProxy.get(), m_OutputProxy.get(), g_AclConvertPolicy, 0);
35  }
36 }
37 
39 {
 // Runs m_Layer via RunClFunction inside a profiling event tagged with this workload's GUID.
 // CHECK_LOCATION() supplies the CheckLocation argument that RunClFunction takes.
40  ARMNN_SCOPED_PROFILING_EVENT_CL_GUID("ClConvertFp32ToFp16Workload_Execute", this->GetGuid());
41  RunClFunction(m_Layer, CHECK_LOCATION());
42 }
43 
45 {
 // Validates an Fp32 -> Fp16 conversion for the given tensor infos.
 // Returns a RUNTIME_ERROR status if the input is not Float32 or the output is not Float16;
 // otherwise returns whatever CLDepthConvertLayer::validate() reports.
46  if (input.GetDataType() != DataType::Float32)
47  {
48  return arm_compute::Status(arm_compute::ErrorCode::RUNTIME_ERROR, "Input should be Float32");
49  }
50  if (output.GetDataType() != DataType::Float16)
51  {
52  return arm_compute::Status(arm_compute::ErrorCode::RUNTIME_ERROR, "Output should be Float16");
53  }
54 
 // Data types are acceptable: convert the tensor infos to their arm_compute form.
55  const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
56  const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output);
57 
 // Same policy and trailing 0 as the configure() call in the constructor.
58  const arm_compute::Status aclStatus = arm_compute::CLDepthConvertLayer::validate(
59  &aclInputInfo, &aclOutputInfo, g_AclConvertPolicy, 0);
60 
61  return aclStatus;
62 }
63 
65 {
66  ITensorHandle* backupHandle = this->m_Data.m_Inputs[slot];
67  this->m_Data.m_Inputs[slot] = tensorHandle;
68  try
69  {
70  Reconfigure();
71  }
73  {
74  // Cannot reconfigure, revert the slot back and throw the exception.
75  this->m_Data.m_Inputs[slot] = backupHandle;
76  throw e;
77  }
78 }
79 
80 // Replace output tensor handle with the given TensorHandle
82 {
83  ITensorHandle* backupHandle = this->m_Data.m_Inputs[slot];
84  this->m_Data.m_Inputs[slot] = tensorHandle;
85  try
86  {
87  Reconfigure();
88  }
90  {
91  // Cannot reconfigure, revert the slot back and throw the exception.
92  this->m_Data.m_Inputs[slot] = backupHandle;
93  throw e;
94  }
95 }
96 
97 void ClConvertFp32ToFp16Workload::Reconfigure()
98 {
99  arm_compute::ICLTensor& input = static_cast<IClTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
100  arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
101  m_InputProxy->set(&input);
102  m_OutputProxy->set(&output);
103 }
104 
105 } //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_CL_GUID(name, guid)
arm_compute::Status ClConvertFp32ToFp16WorkloadValidate(const TensorInfo &input, const TensorInfo &output)
void RunClFunction(arm_compute::IFunction &function, const CheckLocation &location)
void ValidateInputsOutputs(const std::string &descName, unsigned int numExpectedIn, unsigned int numExpectedOut) const
Copyright (c) 2021 ARM Limited and Contributors.
#define ARMNN_SCOPED_PROFILING_EVENT(backendId, name)
Definition: Profiling.hpp:220
QueueDescriptor m_Data
Definition: Workload.hpp:77
DataType GetDataType() const
Definition: Tensor.hpp:198
Status
enumeration
Definition: Types.hpp:29
void ReplaceInputTensorHandle(ITensorHandle *tensorHandle, unsigned int slot) override
#define CHECK_LOCATION()
Definition: Exceptions.hpp:209
void ReplaceOutputTensorHandle(ITensorHandle *tensorHandle, unsigned int slot) override
ClConvertFp32ToFp16Workload(const ConvertFp32ToFp16QueueDescriptor &descriptor, const WorkloadInfo &info, const arm_compute::CLCompileContext &clCompileContext)
profiling::ProfilingGuid GetGuid() const final
Definition: Workload.hpp:55
std::vector< ITensorHandle * > m_Outputs
Contains information about TensorInfos of a layer.
std::vector< ITensorHandle * > m_Inputs