ArmNN
 20.02
ClConcatWorkload.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017 Arm Ltd. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 #include "ClConcatWorkload.hpp"
6 #include "ClWorkloadUtils.hpp"
9 #include <cl/ClTensorHandle.hpp>
10 #include <cl/ClLayerSupport.hpp>
11 
12 #include <arm_compute/core/Types.h>
13 #include <arm_compute/runtime/CL/functions/CLConcatenateLayer.h>
14 
15 #include <boost/polymorphic_pointer_cast.hpp>
16 
17 namespace armnn
18 {
19 using namespace armcomputetensorutils;
20 
21 namespace
22 {
23 size_t CalcAxis(const OriginsDescriptor& desc)
24 {
25  return (desc.GetNumDimensions() - desc.GetConcatAxis()) - 1;
26 }
27 } //namespace
28 
29 arm_compute::Status ClConcatWorkloadValidate(const std::vector<const TensorInfo*>& inputs,
30  const TensorInfo& output,
31  const OriginsDescriptor& descriptor)
32 {
33  std::vector<arm_compute::TensorInfo> aclInputs;
34  for (const TensorInfo* input : inputs)
35  {
36  arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(*input, armnn::DataLayout::NCHW);
37  aclInputs.emplace_back(aclInputInfo);
38  }
39  const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output);
40  std::vector<arm_compute::ITensorInfo*> aclInputPtrs;
41  for (arm_compute::ITensorInfo& input : aclInputs)
42  {
43  aclInputPtrs.emplace_back(&input);
44  }
45 
46  size_t aclAxis = CalcAxis(descriptor);
47  return arm_compute::CLConcatenateLayer::validate(aclInputPtrs, &aclOutputInfo, aclAxis);
48 }
49 
// Constructor body of ClConcatWorkload.
// NOTE(review): the signature line (listing line 50) is absent from this
// listing; the definition resumes at the member-initializer list below.
//
// Forwards descriptor and info to BaseWorkload, then configures a
// CLConcatenateLayer and stores it in m_Layer -- unless every input reports a
// parent, in which case configuration is skipped and m_Layer is left unset.
51 : BaseWorkload<ConcatQueueDescriptor>(descriptor, info)
52 {
53  bool allInputsAreSubtensors = true;
54 
55  // Check that all inputs are sub-tensors (an input counts as one when GetParent() is non-null)
56  for (auto input : descriptor.m_Inputs)
57  {
58  if (!input->GetParent())
59  {
60  // Non sub-tensor input found so we need to execute the concat function
61  allInputsAreSubtensors = false;
62  break;
63  }
64  }
65 
66  if (allInputsAreSubtensors)
67  {
68  // Can skip configuring the concat function since it's not executed
  // (m_Layer is not assigned on this path, and Execute() only runs a non-null m_Layer)
69  return;
70  }
71 
  // Gather the CL tensor behind each input handle; each handle is downcast to IClTensorHandle.
72  std::vector<arm_compute::ICLTensor *> aclInputs;
73  for (auto input : m_Data.m_Inputs)
74  {
75  arm_compute::ICLTensor& aclInput = boost::polymorphic_pointer_downcast<IClTensorHandle>(input)->GetTensor();
76  aclInputs.emplace_back(&aclInput);
77  }
  // Only the first output handle is used as the destination tensor.
78  arm_compute::ICLTensor& output = boost::polymorphic_pointer_downcast<IClTensorHandle>(
79  m_Data.m_Outputs[0])->GetTensor();
80 
81  // Create the layer function
82  auto layer = std::make_unique<arm_compute::CLConcatenateLayer>();
83 
84  // Configure input and output tensors, using the axis computed by CalcAxis from the descriptor parameters
85  size_t aclAxis = CalcAxis(descriptor.m_Parameters);
86  layer->configure(aclInputs, &output, aclAxis);
87 
88  // Prepare the function once here, then hand ownership of it to m_Layer
89  layer->prepare();
90  m_Layer = std::move(layer);
91 }
92 
// Body of ClConcatWorkload::Execute.
// NOTE(review): the signature line (listing line 93) is absent from this
// listing; the index at the end of the page gives it as
// `void Execute() const override`.
//
// Runs the configured concatenate function inside a CL profiling scope. When
// m_Layer is null (the constructor returned before configuring a layer),
// nothing is executed.
94 {
95  if (m_Layer)
96  {
97  ARMNN_SCOPED_PROFILING_EVENT_CL("ClConcatWorkload_Execute");
98  m_Layer->run();
99  }
100 }
101 
102 } //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_CL(name)
const ConcatQueueDescriptor m_Data
Definition: Workload.hpp:46
Copyright (c) 2020 ARM Limited.
An OriginsDescriptor for the ConcatLayer.
Status
enumeration
Definition: Types.hpp:26
void Execute() const override
std::vector< ITensorHandle * > m_Outputs
ClConcatWorkload(const ConcatQueueDescriptor &descriptor, const WorkloadInfo &info)
arm_compute::Status ClConcatWorkloadValidate(const std::vector< const TensorInfo *> &inputs, const TensorInfo &output, const OriginsDescriptor &descriptor)
Contains information about inputs and outputs to a layer.
std::vector< ITensorHandle * > m_Inputs