ArmNN
 21.02
ClConcatWorkload.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 #include "ClConcatWorkload.hpp"
6 #include "ClWorkloadUtils.hpp"
10 #include <cl/ClTensorHandle.hpp>
11 #include <cl/ClLayerSupport.hpp>
12 
13 #include <arm_compute/core/Types.h>
14 
15 namespace armnn
16 {
17 using namespace armcomputetensorutils;
18 
19 namespace
20 {
21 size_t CalcAxis(const OriginsDescriptor& desc)
22 {
23  return (desc.GetNumDimensions() - desc.GetConcatAxis()) - 1;
24 }
25 } //namespace
26 
27 arm_compute::Status ClConcatWorkloadValidate(const std::vector<const TensorInfo*>& inputs,
28  const TensorInfo& output,
29  const OriginsDescriptor& descriptor)
30 {
31  std::vector<arm_compute::TensorInfo> aclInputs;
32  for (const TensorInfo* input : inputs)
33  {
34  arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(*input, armnn::DataLayout::NCHW);
35  aclInputs.emplace_back(aclInputInfo);
36  }
37  const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output);
38  std::vector<const arm_compute::ITensorInfo*> aclInputPtrs;
39  for (arm_compute::ITensorInfo& input : aclInputs)
40  {
41  aclInputPtrs.emplace_back(&input);
42  }
43 
44  size_t aclAxis = CalcAxis(descriptor);
45  return arm_compute::CLConcatenateLayer::validate(aclInputPtrs, &aclOutputInfo, aclAxis);
46 }
47 
49  const WorkloadInfo& info,
50  const arm_compute::CLCompileContext& clCompileContext)
51 : BaseWorkload<ConcatQueueDescriptor>(descriptor, info)
52 {
53  bool allInputsAreSubtensors = true;
54 
55  // Check that all inputs are sub-tensors
56  for (auto input : descriptor.m_Inputs)
57  {
58  if (!input->GetParent())
59  {
60  // Non sub-tensor input found so we need to execute the concat function
61  allInputsAreSubtensors = false;
62  break;
63  }
64  }
65 
66  if (allInputsAreSubtensors)
67  {
68  // Can skip configuring the concat function since it's not executed
69  return;
70  }
71 
72  std::vector<const arm_compute::ICLTensor *> aclInputs;
73  for (auto input : m_Data.m_Inputs)
74  {
75  arm_compute::ICLTensor& aclInput = armnn::PolymorphicPointerDowncast<IClTensorHandle>(input)->GetTensor();
76  aclInputs.emplace_back(&aclInput);
77  }
78 
79  arm_compute::ICLTensor& output =
80  armnn::PolymorphicPointerDowncast<IClTensorHandle>(m_Data.m_Outputs[0])->GetTensor();
81 
82  // Create the layer function
83  auto layer = std::make_unique<arm_compute::CLConcatenateLayer>();
84 
85  // Configure input and output tensors
86  size_t aclAxis = CalcAxis(descriptor.m_Parameters);
87  layer->configure(clCompileContext, aclInputs, &output, aclAxis);
88 
89  // Prepare
90  layer->prepare();
91  m_Layer = std::move(layer);
92 }
93 
95 {
96  if (m_Layer)
97  {
98  ARMNN_SCOPED_PROFILING_EVENT_CL("ClConcatWorkload_Execute");
99  m_Layer->run();
100  }
101 }
102 
103 } //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_CL(name)
const ConcatQueueDescriptor m_Data
Definition: Workload.hpp:46
Copyright (c) 2021 ARM Limited and Contributors.
An OriginsDescriptor for the ConcatLayer.
Status
enumeration
Definition: Types.hpp:26
void Execute() const override
std::vector< ITensorHandle * > m_Outputs
ClConcatWorkload(const ConcatQueueDescriptor &descriptor, const WorkloadInfo &info, const arm_compute::CLCompileContext &clCompileContext)
arm_compute::Status ClConcatWorkloadValidate(const std::vector< const TensorInfo *> &inputs, const TensorInfo &output, const OriginsDescriptor &descriptor)
Contains information about inputs and outputs to a layer.
std::vector< ITensorHandle * > m_Inputs