8 #include <arm_compute/runtime/NEON/functions/NESplit.h> 20 using namespace armcomputetensorutils;
/// Mirrors an axis index across the dimension range, so that axis 0 maps to
/// the last index (numDimensions - 1) and the last axis maps to 0.
/// NOTE(review): presumably used to translate a split axis into the axis
/// numbering expected by the Arm Compute Library - confirm against callers.
///
/// @param numDimensions Number of dimensions of the tensor being split.
/// @param splitAxis     Axis index to mirror; must be less than numDimensions.
/// @return (numDimensions - splitAxis) - 1.
///
/// The arithmetic is unsigned: if splitAxis >= numDimensions the subtraction
/// wraps around instead of going negative, so callers must pass a valid axis.
unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int splitAxis)
{
    return (numDimensions - splitAxis) - 1;
}
// Fragment of a validation routine for the Neon split function. The first line of the
// signature, the braces and the statement that defines aclAxis are not visible in this
// listing. What is visible: ACL tensor infos are built for the input and for every
// output, and the result of arm_compute::NESplit::validate is returned.
32 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
33 unsigned int splitAxis)
// ACL-side description of the input tensor.
35 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
37 size_t numOutputs = outputs.size();
// Owning storage for the ACL-side output descriptions.
39 std::vector<arm_compute::TensorInfo> aclOutputs;
// Reserving up front matters: the loop below appends exactly outputs.size() elements,
// so aclOutputs never reallocates and the addresses stored in aclOutputPtr stay valid.
40 aclOutputs.reserve(numOutputs);
// Non-owning pointers into aclOutputs, in the form passed to NESplit::validate.
42 std::vector<arm_compute::ITensorInfo*> aclOutputPtr;
43 aclOutputPtr.reserve(numOutputs);
45 for (
size_t i = 0u; i < outputs.size(); ++i)
// Build the ACL info for output i, then record the address of the element just added.
47 aclOutputs.emplace_back(BuildArmComputeTensorInfo(outputs[i]));
48 aclOutputPtr.emplace_back(&aclOutputs.back());
// aclAxis is defined on a line that is not part of this listing.
// NOTE(review): presumably derived from splitAxis via CalcAclAxis - confirm.
52 return arm_compute::NESplit::validate(&aclInputInfo, aclOutputPtr, aclAxis);
// Fragment of a routine that sets up an arm_compute::NESplit and stores it in m_Layer.
// NOTE(review): presumably the NeonSplitterWorkload constructor body - its header, both
// loop headers, the bodies of the two if statements and the definitions of splitAxis
// and aclAxis are not visible in this listing.
// The flag starts out true and is cleared as soon as a disqualifying output is seen.
58 bool allOutputsAreSubtensors =
true;
// A non-null output whose GetParent() is null clears the flag.
// NOTE(review): presumably a handle with a parent is a sub-tensor of it - confirm.
63 if (output && !output->GetParent())
66 allOutputsAreSubtensors =
false;
// The body of this branch is not visible in this listing.
71 if (allOutputsAreSubtensors)
// Fetch the ACL tensor behind the first input handle.
77 arm_compute::ITensor& input = boost::polymorphic_downcast<IAclTensorHandle*>(
m_Data.
m_Inputs[0])->GetTensor();
// Non-owning pointers to the ACL tensors behind the output handles.
79 std::vector<arm_compute::ITensor *> aclOutputs;
82 arm_compute::ITensor& aclOutput = boost::polymorphic_pointer_downcast<IAclTensorHandle>(output)->GetTensor();
83 aclOutputs.emplace_back(&aclOutput);
// The split function is held by a local unique_ptr until it is handed to m_Layer below.
87 std::unique_ptr<arm_compute::NESplit> layer(
new arm_compute::NESplit());
// splitAxis is defined on a line not visible here; the body of this check is also missing.
// NOTE(review): presumably rejects descriptors that do not yield exactly one split axis.
91 if (splitAxis.size() != 1)
// Configure the function with the input tensor, the output tensors and the axis
// (aclAxis is defined on a line not visible in this listing).
97 layer->configure(&input, aclOutputs, aclAxis);
// Hand the raw pointer from the local unique_ptr over to m_Layer.
101 m_Layer.reset(layer.release());
NeonSplitterWorkload(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info)
#define ARMNN_SCOPED_PROFILING_EVENT_NEON(name)
unsigned int GetNumDimensions() const
LayerDescriptor m_Parameters
std::set< unsigned int > ComputeSplitAxis(const armnn::SplitterDescriptor &desc, const TensorShape &input)
uint32_t GetNumDimensions() const
Get the number of dimensions.
const SplitterQueueDescriptor m_Data
void Execute() const override
std::vector< ITensorHandle * > m_Outputs
std::vector< ITensorHandle * > m_Inputs
arm_compute::Status NeonSplitterWorkloadValidate(const TensorInfo &input, const std::vector< std::reference_wrapper< TensorInfo >> &outputs, unsigned int splitAxis)