// // Copyright © 2017-2024 Arm Ltd and Contributors. All rights reserved. // SPDX-License-Identifier: MIT // #include "SplitterLayer.hpp" #include "LayerCloneBase.hpp" #include #include #include #include namespace armnn { SplitterLayer::SplitterLayer(const ViewsDescriptor& param, const char* name) : LayerWithParameters(1, param.GetNumViews(), LayerType::Splitter, param, name) { } std::unique_ptr SplitterLayer::CreateWorkload(const IWorkloadFactory& factory) const { SplitterQueueDescriptor descriptor; // Copies the window origins to the descriptor. for (unsigned int i = 0; i < m_Param.GetNumViews(); ++i) { descriptor.m_ViewOrigins.emplace_back( std::vector(m_Param.GetViewOrigin(i), m_Param.GetViewOrigin(i) + m_Param.GetNumDimensions())); } SetAdditionalInfo(descriptor); return factory.CreateWorkload(LayerType::Splitter, descriptor, PrepInfoAndDesc(descriptor)); } template void SplitterLayer::CreateTensors(const TensorHandleFactoryRegistry& registry, const FactoryType& factory, bool isMemoryManaged) { //If sub tensors are supported than all the "splitter" need to do is to //set the outputs to be appropriate sub tensors of the input. bool useSubTensors = factory.SupportsSubTensors(); if (useSubTensors) { // Get outputHandler of previous layer const OutputHandler& outputHandler = GetInputSlots()[0].GetConnectedOutputSlot()->GetOutputHandler(); const OutputSlot* slot = GetInputSlots()[0].GetConnectedOutputSlot(); const TensorInfo& parentInfo = GetInputSlot(0).GetTensorInfo(); ITensorHandle* inputData = outputHandler.GetData(); std::vector> subTensors; // check if split is along the x or y (2 innermost dimensions) auto numberOfDimensions = m_Param.GetNumDimensions(); std::set axis = ComputeSplitAxis(m_Param, parentInfo.GetShape()); std::set::iterator axisIt = axis.begin(); bool isOnXorY = m_Param.GetNumDimensions() >= 3 && ((*axisIt == numberOfDimensions - 1) || (*axisIt == numberOfDimensions - 2)); //Creates the outputs as subtensors of the input. for (unsigned int i = 0; i < m_Param.GetNumViews(); ++i) { const TensorInfo& info = m_OutputHandlers[i].GetTensorInfo(); OutputSlot& outSlot = GetOutputSlot(i); ITensorHandleFactory::FactoryId factoryId = outSlot.GetTensorHandleFactoryId(); const unsigned int numOutputSlots = GetNumOutputSlots(); // if split along x or y (2 innermost dimensions) and the next layers do not require padding bool canUseSubTensorOnXorY = true; bool isTensorHandleFactory = std::is_same::value; if (isTensorHandleFactory) { for (unsigned int it = 0; it < numOutputSlots; ++it) { InputSlot* inputSlot = GetOutputSlot(it).GetConnection(0); ITensorHandleFactory* handleFactory = registry.GetFactory(factoryId); std::vector capabilities = handleFactory->GetCapabilities(&(inputSlot->GetOwningLayer()), this, CapabilityClass::PaddingRequired); if (isOnXorY) { canUseSubTensorOnXorY = false; if (capabilities.empty()) { canUseSubTensorOnXorY = true; } } if (!canUseSubTensorOnXorY) { break; } } } auto CreateSubTensor = [&]() { // Make sure: // 1) quantization parameters are in the same space // 2) the same TensorHandleFactory is used for input and split layer output // 3) the output does not go to a Constant layer or input layer // 4) if split along x or y (2 innermost dimensions) and the next layers do not require padding if (parentInfo.IsTypeSpaceMatch(info) && //(1) factoryId == slot->GetTensorHandleFactoryId() && //(2) GetOutputSlot(i).GetConnection(0)->GetOwningLayer().GetType() != LayerType::Constant && //(3) GetOutputSlot(i).GetConnection(0)->GetOwningLayer().GetType() != LayerType::Input && //(3) canUseSubTensorOnXorY) //(4) { ARMNN_NO_DEPRECATE_WARN_BEGIN return factory.CreateSubTensorHandle(*inputData, info.GetShape(), this->m_Param.GetViewOrigin(i)); ARMNN_NO_DEPRECATE_WARN_END } return std::unique_ptr(); }; auto subTensor = CreateSubTensor(); if (!subTensor) { useSubTensors = false; break; //Failed to create a valid sub-tensor, so stop trying with the rest of the views. } subTensors.push_back(std::move(subTensor)); } if (useSubTensors) { unsigned int i = 0; for (auto& subTensor : subTensors) { m_OutputHandlers[i].SetData(std::move(subTensor)); ++i; } } } if (!useSubTensors) { for (unsigned int i = 0; i < m_Param.GetNumViews(); ++i) { m_OutputHandlers[i].CreateTensorHandles(factory, isMemoryManaged); } } } void SplitterLayer::CreateTensorHandles(const TensorHandleFactoryRegistry& registry, const IWorkloadFactory& workloadFactory, const bool isMemoryManaged) { OutputSlot& slot = GetOutputSlot(0); ITensorHandleFactory::FactoryId factoryId = slot.GetTensorHandleFactoryId(); if (factoryId == ITensorHandleFactory::LegacyFactoryId) { CreateTensors(registry, workloadFactory, isMemoryManaged); } else { ITensorHandleFactory* handleFactory = registry.GetFactory(factoryId); if (!handleFactory) { throw armnn::NullPointerException("handleFactory is returning a nullptr."); } CreateTensors(registry, *handleFactory, isMemoryManaged); } } SplitterLayer* SplitterLayer::Clone(Graph& graph) const { return CloneBase(graph, m_Param, GetName()); } std::vector SplitterLayer::InferOutputShapes(const std::vector& inputShapes) const { if (inputShapes.size() != m_Param.GetNumViews()) { throw armnn::Exception("inputShapes' and m_NumViews' sizes do not match (\"" + std::to_string(inputShapes.size()) + "\" vs \"" + std::to_string(m_Param.GetNumViews()) + "\")"); } std::vector outShapes; //Output shapes must match View shapes. for (unsigned int viewIdx = 0; viewIdx < m_Param.GetNumViews(); viewIdx++) { const uint32_t* sizes = m_Param.GetViewSizes(viewIdx); outShapes.push_back(TensorShape(m_Param.GetNumDimensions(), sizes)); } return outShapes; } void SplitterLayer::ValidateTensorShapesFromInputs() { std::for_each(BeginOutputSlots(), EndOutputSlots(), [&](OutputSlot& outputSlot) { VerifyShapeInferenceType(outputSlot.GetTensorInfo().GetShape(), m_ShapeInferenceMethod); }); std::vector views; for (unsigned int viewIdx = 0; viewIdx < m_Param.GetNumViews(); viewIdx++) { const uint32_t* sizes = m_Param.GetViewSizes(viewIdx); views.push_back(TensorShape(m_Param.GetNumDimensions(), sizes)); } auto inferredShapes = InferOutputShapes(views); if (inferredShapes.size() != m_Param.GetNumViews()) { throw armnn::LayerValidationException("inferredShapes' size and m_NumViews do not match (\"" + std::to_string(inferredShapes.size()) + "\" vs \"" + std::to_string(m_Param.GetNumViews()) + "\")"); } for (unsigned int viewIdx = 0; viewIdx < m_Param.GetNumViews(); viewIdx++) { ValidateAndCopyShape(GetOutputSlot(viewIdx).GetTensorInfo().GetShape(), inferredShapes[viewIdx], m_ShapeInferenceMethod, "SplitterLayer", viewIdx); } } void SplitterLayer::ExecuteStrategy(IStrategy& strategy) const { strategy.ExecuteStrategy(this, GetParameters(), {}, GetName()); } } // namespace armnn