ArmNN
 21.11
ClWorkloadFactory.hpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 #pragma once
6 
7 #include <armnn/IRuntime.hpp>
8 #include <armnn/Optional.hpp>
9 
11 
14 
15 #include <arm_compute/core/CL/CLCompileContext.h>
16 
17 namespace armnn
18 {
19 
20 // ARM Compute OpenCL workload factory (class ClWorkloadFactory; its declaration, listing line 21, is missing from this extract).
22 {
23 public:
// Constructs the factory from a shared ClMemoryManager (presumably kept in
// m_MemoryManager; the definition is not visible here).
// NOTE(review): this single-argument constructor is not `explicit`, so a
// std::shared_ptr<ClMemoryManager> converts implicitly to a ClWorkloadFactory - confirm this is intended.
24  ClWorkloadFactory(const std::shared_ptr<ClMemoryManager>& memoryManager);
25 
26  ClWorkloadFactory(const std::shared_ptr<ClMemoryManager>& memoryManager,
28 
29  void AfterWorkloadsCreated() override;
30 
31  const BackendId& GetBackendId() const override;
32 
// Static support query taking a graph Layer and an optional DataType; returns bool.
// outReasonIfUnsupported is a non-const reference - presumably filled with an
// explanation when the result is false; confirm against the definition.
33  static bool IsLayerSupported(const Layer& layer,
34  Optional<DataType> dataType,
35  std::string& outReasonIfUnsupported);
36 
// Overload of the static support query that takes the public IConnectableLayer
// interface plus a ModelOptions argument; returns bool.
// outReasonIfUnsupported is a non-const reference - presumably filled with an
// explanation when the result is false; confirm against the definition.
37  static bool IsLayerSupported(const IConnectableLayer& layer,
38  Optional<DataType> dataType,
39  std::string& outReasonIfUnsupported,
40  const ModelOptions& modelOptions);
41 
// Unconditionally returns true.
42  bool SupportsSubTensors() const override { return true; }
43 
// Deprecated override: the deprecation message directs callers to
// ITensorHandleFactory::CreateSubTensorHandle instead.
// Takes the parent handle, the sub-tensor shape and a pointer to the sub-tensor
// origin; returns an owning ITensorHandle pointer.
// NOTE(review): subTensorOrigin is a raw pointer with no length - presumably one
// entry per dimension of subTensorShape; confirm against the definition.
44  ARMNN_DEPRECATED_MSG("Use ITensorHandleFactory::CreateSubTensorHandle instead")
45  std::unique_ptr<ITensorHandle> CreateSubTensorHandle(ITensorHandle& parent,
46  TensorShape const& subTensorShape,
47  unsigned int const* subTensorOrigin) const override;
48 
// Deprecated override: the deprecation message directs callers to
// ITensorHandleFactory::CreateTensorHandle instead.
// Returns an owning ITensorHandle pointer for the given TensorInfo.
// NOTE(review): IsMemoryManaged has a default argument on a virtual override.
// Default arguments are chosen from the static type of the call expression, so
// this value must stay in sync with the base-class declaration (not visible here).
49  ARMNN_DEPRECATED_MSG("Use ITensorHandleFactory::CreateTensorHandle instead")
50  std::unique_ptr<ITensorHandle> CreateTensorHandle(const TensorInfo& tensorInfo,
51  const bool IsMemoryManaged = true) const override;
52 
// Deprecated override: the deprecation message directs callers to
// ITensorHandleFactory::CreateTensorHandle instead.
// Same as the two-parameter overload but additionally takes a DataLayout.
// NOTE(review): IsMemoryManaged has a default argument on a virtual override.
// Default arguments are chosen from the static type of the call expression, so
// this value must stay in sync with the base-class declaration (not visible here).
53  ARMNN_DEPRECATED_MSG("Use ITensorHandleFactory::CreateTensorHandle instead")
54  std::unique_ptr<ITensorHandle> CreateTensorHandle(const TensorInfo& tensorInfo,
55  DataLayout dataLayout,
56  const bool IsMemoryManaged = true) const override;
57 
58  std::unique_ptr<IWorkload> CreateActivation(const ActivationQueueDescriptor& descriptor,
59  const WorkloadInfo& info) const override;
60 
61  std::unique_ptr<IWorkload> CreateAddition(const AdditionQueueDescriptor& descriptor,
62  const WorkloadInfo& info) const override;
63 
64  std::unique_ptr<IWorkload> CreateArgMinMax(const ArgMinMaxQueueDescriptor& descriptor,
65  const WorkloadInfo& info) const override;
66 
67  std::unique_ptr<IWorkload> CreateBatchNormalization(const BatchNormalizationQueueDescriptor& descriptor,
68  const WorkloadInfo& info) const override;
69 
70  std::unique_ptr<IWorkload> CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor& descriptor,
71  const WorkloadInfo& info) const override;
72 
73  std::unique_ptr<IWorkload> CreateCast(const CastQueueDescriptor& descriptor,
74  const WorkloadInfo& info) const override;
75 
76  std::unique_ptr<IWorkload> CreateChannelShuffle(const ChannelShuffleQueueDescriptor& descriptor,
77  const WorkloadInfo& info) const override;
78 
79  std::unique_ptr<IWorkload> CreateComparison(const ComparisonQueueDescriptor& descriptor,
80  const WorkloadInfo& info) const override;
81 
82  std::unique_ptr<IWorkload> CreateConcat(const ConcatQueueDescriptor& descriptor,
83  const WorkloadInfo& info) const override;
84 
85  std::unique_ptr<IWorkload> CreateConstant(const ConstantQueueDescriptor& descriptor,
86  const WorkloadInfo& info) const override;
87 
88  std::unique_ptr<IWorkload> CreateConvertFp16ToFp32(const ConvertFp16ToFp32QueueDescriptor& descriptor,
89  const WorkloadInfo& info) const override;
90 
91  std::unique_ptr<IWorkload> CreateConvertFp32ToFp16(const ConvertFp32ToFp16QueueDescriptor& descriptor,
92  const WorkloadInfo& info) const override;
93 
94  std::unique_ptr<IWorkload> CreateConvolution2d(const Convolution2dQueueDescriptor& descriptor,
95  const WorkloadInfo& info) const override;
96 
97  std::unique_ptr<IWorkload> CreateConvolution3d(const Convolution3dQueueDescriptor& descriptor,
98  const WorkloadInfo& info) const override;
99 
100  std::unique_ptr<IWorkload> CreateDebug(const DebugQueueDescriptor& descriptor,
101  const WorkloadInfo& info) const override;
102 
103  std::unique_ptr<IWorkload> CreateDepthToSpace(const DepthToSpaceQueueDescriptor& descriptor,
104  const WorkloadInfo& info) const override;
105 
106  std::unique_ptr<IWorkload> CreateDepthwiseConvolution2d(const DepthwiseConvolution2dQueueDescriptor& descriptor,
107  const WorkloadInfo& info) const override;
108 
109  std::unique_ptr<IWorkload> CreateDequantize(const DequantizeQueueDescriptor& descriptor,
110  const WorkloadInfo& info) const override;
111 
112  std::unique_ptr<IWorkload> CreateDetectionPostProcess(const DetectionPostProcessQueueDescriptor& descriptor,
113  const WorkloadInfo& info) const override;
114 
115  std::unique_ptr<IWorkload> CreateDivision(const DivisionQueueDescriptor& descriptor,
116  const WorkloadInfo& info) const override;
117 
118  std::unique_ptr<IWorkload> CreateElementwiseUnary(const ElementwiseUnaryQueueDescriptor& descriptor,
119  const WorkloadInfo& info) const override;
120 
121  std::unique_ptr<IWorkload> CreateFill(const FillQueueDescriptor& descriptor,
122  const WorkloadInfo& info) const override;
123 
124  std::unique_ptr<IWorkload> CreateFloor(const FloorQueueDescriptor& descriptor,
125  const WorkloadInfo& info) const override;
126 
127  std::unique_ptr<IWorkload> CreateFullyConnected(const FullyConnectedQueueDescriptor& descriptor,
128  const WorkloadInfo& info) const override;
129 
130  std::unique_ptr<IWorkload> CreateGather(const GatherQueueDescriptor& descriptor,
131  const WorkloadInfo& info) const override;
132 
133  std::unique_ptr<IWorkload> CreateInput(const InputQueueDescriptor& descriptor,
134  const WorkloadInfo& info) const override;
135 
136  std::unique_ptr<IWorkload> CreateInstanceNormalization(const InstanceNormalizationQueueDescriptor& descriptor,
137  const WorkloadInfo& info) const override;
138 
139  std::unique_ptr<IWorkload> CreateL2Normalization(const L2NormalizationQueueDescriptor& descriptor,
140  const WorkloadInfo& info) const override;
141 
142  std::unique_ptr<IWorkload> CreateLogicalBinary(const LogicalBinaryQueueDescriptor& descriptor,
143  const WorkloadInfo& info) const override;
144 
145  std::unique_ptr<IWorkload> CreateLogSoftmax(const LogSoftmaxQueueDescriptor& descriptor,
146  const WorkloadInfo& info) const override;
147 
148  std::unique_ptr<IWorkload> CreateLstm(const LstmQueueDescriptor& descriptor,
149  const WorkloadInfo& info) const override;
150 
151  std::unique_ptr<IWorkload> CreateMaximum(const MaximumQueueDescriptor& descriptor,
152  const WorkloadInfo& info) const override;
153 
// Override taking a MeanQueueDescriptor and a WorkloadInfo; returns an owning
// IWorkload pointer. The definition is out of line and not visible here.
// The second parameter is named `info` to match every sibling Create* declaration
// (it was previously spelled `Info`); parameter names in a declaration do not affect callers.
154  std::unique_ptr<IWorkload> CreateMean(const MeanQueueDescriptor& descriptor,
155  const WorkloadInfo& info) const override;
156 
157  std::unique_ptr<IWorkload> CreateMemCopy(const MemCopyQueueDescriptor& descriptor,
158  const WorkloadInfo& info) const override;
159 
160  std::unique_ptr<IWorkload> CreateMemImport(const MemImportQueueDescriptor& descriptor,
161  const WorkloadInfo& info) const override;
162 
163  std::unique_ptr<IWorkload> CreateMinimum(const MinimumQueueDescriptor& descriptor,
164  const WorkloadInfo& info) const override;
165 
166  std::unique_ptr<IWorkload> CreateMultiplication(const MultiplicationQueueDescriptor& descriptor,
167  const WorkloadInfo& info) const override;
168 
169  std::unique_ptr<IWorkload> CreateNormalization(const NormalizationQueueDescriptor& descriptor,
170  const WorkloadInfo& info) const override;
171 
172  std::unique_ptr<IWorkload> CreateOutput(const OutputQueueDescriptor& descriptor,
173  const WorkloadInfo& info) const override;
174 
175  std::unique_ptr<IWorkload> CreatePad(const PadQueueDescriptor& descriptor,
176  const WorkloadInfo& info) const override;
177 
178  std::unique_ptr<IWorkload> CreatePermute(const PermuteQueueDescriptor& descriptor,
179  const WorkloadInfo& info) const override;
180 
181  std::unique_ptr<IWorkload> CreatePooling2d(const Pooling2dQueueDescriptor& descriptor,
182  const WorkloadInfo& info) const override;
183 
184  std::unique_ptr<IWorkload> CreatePreCompiled(const PreCompiledQueueDescriptor& descriptor,
185  const WorkloadInfo& info) const override;
186 
187  std::unique_ptr<IWorkload> CreatePrelu(const PreluQueueDescriptor& descriptor,
188  const WorkloadInfo& info) const override;
189 
190  std::unique_ptr<IWorkload> CreateQLstm(const QLstmQueueDescriptor& descriptor,
191  const WorkloadInfo& info) const override;
192 
193  std::unique_ptr<IWorkload> CreateQuantize(const QuantizeQueueDescriptor& descriptor,
194  const WorkloadInfo& info) const override;
195 
196  std::unique_ptr<IWorkload> CreateQuantizedLstm(const QuantizedLstmQueueDescriptor& descriptor,
197  const WorkloadInfo& info) const override;
198 
199  std::unique_ptr<IWorkload> CreateRank(const RankQueueDescriptor& descriptor,
200  const WorkloadInfo& info) const override;
201 
202  std::unique_ptr<IWorkload> CreateReduce(const ReduceQueueDescriptor& descriptor,
203  const WorkloadInfo& info) const override;
204 
205  std::unique_ptr<IWorkload> CreateReshape(const ReshapeQueueDescriptor& descriptor,
206  const WorkloadInfo& info) const override;
207 
208  std::unique_ptr<IWorkload> CreateResize(const ResizeQueueDescriptor& descriptor,
209  const WorkloadInfo& info) const override;
210 
211  std::unique_ptr<IWorkload> CreateSlice(const SliceQueueDescriptor& descriptor,
212  const WorkloadInfo& info) const override;
213 
214  std::unique_ptr<IWorkload> CreateSoftmax(const SoftmaxQueueDescriptor& descriptor,
215  const WorkloadInfo& info) const override;
216 
217  std::unique_ptr<IWorkload> CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor& descriptor,
218  const WorkloadInfo& info) const override;
219 
220  std::unique_ptr<IWorkload> CreateSpaceToDepth(const SpaceToDepthQueueDescriptor& descriptor,
221  const WorkloadInfo& info) const override;
222 
223  std::unique_ptr<IWorkload> CreateSplitter(const SplitterQueueDescriptor& descriptor,
224  const WorkloadInfo& info) const override;
225 
226  std::unique_ptr<IWorkload> CreateStack(const StackQueueDescriptor& descriptor,
227  const WorkloadInfo& info) const override;
228 
229  std::unique_ptr<IWorkload> CreateStridedSlice(const StridedSliceQueueDescriptor& descriptor,
230  const WorkloadInfo& info) const override;
231 
232  std::unique_ptr<IWorkload> CreateSubtraction(const SubtractionQueueDescriptor& descriptor,
233  const WorkloadInfo& info) const override;
234 
235  std::unique_ptr<IWorkload> CreateTranspose(const TransposeQueueDescriptor& descriptor,
236  const WorkloadInfo& info) const override;
237 
238  std::unique_ptr<IWorkload> CreateTransposeConvolution2d(const TransposeConvolution2dQueueDescriptor& descriptor,
239  const WorkloadInfo& info) const override;
240 
241 private:
// Private static helper template, parameterised on two workload types
// (FloatWorkload, Uint8Workload) and the queue descriptor type.
// Takes the descriptor, the WorkloadInfo and a pack of forwarding-reference
// arguments; returns an owning IWorkload pointer.
// NOTE(review): presumably `info` decides which of the two workload types is
// instantiated - confirm against the definition, which is not visible here.
242  template<typename FloatWorkload, typename Uint8Workload, typename QueueDescriptorType, typename... Args>
243  static std::unique_ptr<IWorkload> MakeWorkload(const QueueDescriptorType& descriptor,
244  const WorkloadInfo& info,
245  Args&&... args);
246 
// Private static helper template, parameterised on a single workload type and
// the queue descriptor type.
// Takes the descriptor, the WorkloadInfo and a pack of forwarding-reference
// arguments; returns an owning IWorkload pointer.
// The definition is not visible here.
247  template <typename Workload, typename QueueDescriptorType, typename... Args>
248  static std::unique_ptr<IWorkload> MakeWorkload(const QueueDescriptorType& descriptor,
249  const WorkloadInfo& info,
250  Args&&... args);
251 
252  void InitializeCLCompileContext();
253 
254  mutable std::shared_ptr<ClMemoryManager> m_MemoryManager;
256  arm_compute::CLCompileContext m_CLCompileContext;
257 };
258 
259 } // namespace armnn
std::unique_ptr< IWorkload > CreateDetectionPostProcess(const DetectionPostProcessQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< ITensorHandle > CreateSubTensorHandle(ITensorHandle &parent, TensorShape const &subTensorShape, unsigned int const *subTensorOrigin) const override
std::unique_ptr< IWorkload > CreateComparison(const ComparisonQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateGather(const GatherQueueDescriptor &descriptor, const WorkloadInfo &info) const override
ClWorkloadFactory(const std::shared_ptr< ClMemoryManager > &memoryManager)
Interface for a layer that is connectable to other layers via InputSlots and OutputSlots.
Definition: INetwork.hpp:61
std::unique_ptr< IWorkload > CreateDebug(const DebugQueueDescriptor &descriptor, const WorkloadInfo &info) const override
DataLayout
Definition: Types.hpp:49
std::unique_ptr< IWorkload > CreateReshape(const ReshapeQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateConvolution3d(const Convolution3dQueueDescriptor &descriptor, const WorkloadInfo &info) const override
void AfterWorkloadsCreated() override
std::unique_ptr< IWorkload > CreateConvertFp32ToFp16(const ConvertFp32ToFp16QueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateSpaceToBatchNd(const SpaceToBatchNdQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateDivision(const DivisionQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::vector< BackendOptions > ModelOptions
std::unique_ptr< IWorkload > CreateStridedSlice(const StridedSliceQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateConvertFp16ToFp32(const ConvertFp16ToFp32QueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateQuantize(const QuantizeQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateInput(const InputQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateStack(const StackQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateFullyConnected(const FullyConnectedQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateSlice(const SliceQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< ITensorHandle > CreateTensorHandle(const TensorInfo &tensorInfo, const bool IsMemoryManaged=true) const override
std::unique_ptr< IWorkload > CreateQuantizedLstm(const QuantizedLstmQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateRank(const RankQueueDescriptor &descriptor, const WorkloadInfo &info) const override
const BackendId & GetBackendId() const override
bool SupportsSubTensors() const override
Copyright (c) 2021 ARM Limited and Contributors.
TypedWorkload< QueueDescriptor, armnn::DataType::Float16, armnn::DataType::Float32 > FloatWorkload
Definition: Workload.hpp:170
std::unique_ptr< IWorkload > CreateLstm(const LstmQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateLogicalBinary(const LogicalBinaryQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateLogSoftmax(const LogSoftmaxQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMean(const MeanQueueDescriptor &descriptor, const WorkloadInfo &Info) const override
std::unique_ptr< IWorkload > CreateReduce(const ReduceQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMinimum(const MinimumQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateTransposeConvolution2d(const TransposeConvolution2dQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateFill(const FillQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateCast(const CastQueueDescriptor &descriptor, const WorkloadInfo &info) const override
static bool IsLayerSupported(const Layer &layer, Optional< DataType > dataType, std::string &outReasonIfUnsupported)
std::unique_ptr< IWorkload > CreateQLstm(const QLstmQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateDepthwiseConvolution2d(const DepthwiseConvolution2dQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateDepthToSpace(const DepthToSpaceQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateChannelShuffle(const ChannelShuffleQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::shared_ptr< IBackendModelContext > IBackendSpecificModelContextPtr
std::unique_ptr< IWorkload > CreateResize(const ResizeQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreatePermute(const PermuteQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMemCopy(const MemCopyQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateBatchToSpaceNd(const BatchToSpaceNdQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateSoftmax(const SoftmaxQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMaximum(const MaximumQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateElementwiseUnary(const ElementwiseUnaryQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateFloor(const FloorQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreatePreCompiled(const PreCompiledQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateSubtraction(const SubtractionQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMultiplication(const MultiplicationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateAddition(const AdditionQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreatePooling2d(const Pooling2dQueueDescriptor &descriptor, const WorkloadInfo &info) const override
TypedWorkload< QueueDescriptor, armnn::DataType::QAsymmU8 > Uint8Workload
Definition: Workload.hpp:176
std::unique_ptr< IWorkload > CreateSplitter(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateL2Normalization(const L2NormalizationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateActivation(const ActivationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreatePad(const PadQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateSpaceToDepth(const SpaceToDepthQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateNormalization(const NormalizationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateInstanceNormalization(const InstanceNormalizationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateTranspose(const TransposeQueueDescriptor &descriptor, const WorkloadInfo &info) const override
Contains information about TensorInfos of a layer.
#define ARMNN_DEPRECATED_MSG(message)
Definition: Deprecated.hpp:43
std::unique_ptr< IWorkload > CreateBatchNormalization(const BatchNormalizationQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateConcat(const ConcatQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateMemImport(const MemImportQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreatePrelu(const PreluQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateDequantize(const DequantizeQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateConstant(const ConstantQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateConvolution2d(const Convolution2dQueueDescriptor &descriptor, const WorkloadInfo &info) const override
std::unique_ptr< IWorkload > CreateArgMinMax(const ArgMinMaxQueueDescriptor &descriptor, const WorkloadInfo &info) const override
Depthwise Convolution 2D layer workload data.
std::unique_ptr< IWorkload > CreateOutput(const OutputQueueDescriptor &descriptor, const WorkloadInfo &info) const override