ArmNN 21.05
LoadedNetwork Class Reference

#include <LoadedNetwork.hpp>

Public Types

using WorkloadQueue = std::vector< std::unique_ptr< IWorkload > >
 
using ExecutionTuple = std::tuple< InputTensors, OutputTensors, std::shared_ptr< IAsyncExecutionCallback > >
 
using ExecutionQueue = std::queue< std::shared_ptr< ExecutionTuple > >
 

Public Member Functions

 ~LoadedNetwork ()
 
std::unique_ptr< IWorkingMemHandle > CreateWorkingMemHandle (NetworkId networkId)
 Create a new unique WorkingMemHandle object. More...
 
TensorInfo GetInputTensorInfo (LayerBindingId layerId) const
 
TensorInfo GetOutputTensorInfo (LayerBindingId layerId) const
 
Status EnqueueWorkload (const InputTensors &inputTensors, const OutputTensors &outputTensors)
 Single thread execution of the loaded network. More...
 
Status Execute (const InputTensors &inputTensors, const OutputTensors &outputTensors, IWorkingMemHandle &workingMemHandle)
 Thread safe execution of the loaded network. More...
 
void Schedule (const InputTensors &inputTensors, const OutputTensors &outputTensors, const QosExecPriority priority, std::shared_ptr< IAsyncExecutionCallback > cb)
 Schedule an asynchronous execution on the loaded network. More...
 
const std::shared_ptr< IProfiler > & GetProfiler () const
 
void FreeWorkingMemory ()
 
void RegisterDebugCallback (const DebugCallbackFunction &func)
 
void SendNetworkStructure ()
 
bool IsAsyncEnabled ()
 
profiling::ProfilingGuid GetNetworkGuid ()
 

Static Public Member Functions

static std::unique_ptr< LoadedNetwork > MakeLoadedNetwork (std::unique_ptr< IOptimizedNetwork > net, std::string &errorMessage, const INetworkProperties &networkProperties, profiling::ProfilingService &profilingService, const NetworkId networkIdOut)
 

Detailed Description

Definition at line 35 of file LoadedNetwork.hpp.

Member Typedef Documentation

◆ ExecutionQueue

using ExecutionQueue = std::queue<std::shared_ptr<ExecutionTuple> >

Definition at line 44 of file LoadedNetwork.hpp.

◆ ExecutionTuple

using ExecutionTuple = std::tuple<InputTensors, OutputTensors, std::shared_ptr<IAsyncExecutionCallback> >

Definition at line 42 of file LoadedNetwork.hpp.

◆ WorkloadQueue

using WorkloadQueue = std::vector<std::unique_ptr<IWorkload> >

Definition at line 38 of file LoadedNetwork.hpp.

Constructor & Destructor Documentation

◆ ~LoadedNetwork()

~LoadedNetwork ( )
inline

Definition at line 46 of file LoadedNetwork.hpp.

47  {
48  FreeWorkingMemory();
49  TerminateThreadPool();
50  }

Member Function Documentation

◆ CreateWorkingMemHandle()

std::unique_ptr< IWorkingMemHandle > CreateWorkingMemHandle ( NetworkId  networkId)

Create a new unique WorkingMemHandle object.

Create multiple handles if you wish to have overlapped executions, calling this function once from each thread.

Definition at line 1258 of file LoadedNetwork.cpp.

References ITensorHandle::Allocate(), ARMNN_ASSERT, ARMNN_NO_DEPRECATE_WARN_BEGIN, ARMNN_NO_DEPRECATE_WARN_END, armnn::Constant, ITensorHandleFactory::CreateTensorHandle(), Layer::GetBackendId(), TensorHandleFactoryRegistry::GetFactory(), Layer::GetGuid(), Layer::GetInputSlots(), TensorHandleFactoryRegistry::GetMemoryManagers(), Layer::GetNumOutputSlots(), Layer::GetOutputSlots(), Layer::GetType(), armnn::Input, ITensorHandleFactory::LegacyFactoryId, WorkingMemDescriptor::m_Inputs, WorkingMemDescriptor::m_Outputs, ITensorHandle::Manage(), armnn::MemImport, and armnn::Output.

Referenced by RuntimeImpl::CreateWorkingMemHandle().
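
A hedged usage sketch of the overlapped-execution pattern described above. Here loadedNetwork, networkId and the per-thread tensor vectors inputs[t] / outputs[t] are assumptions supplied by the caller; applications normally drive this through IRuntime rather than through LoadedNetwork directly.

#include <thread>
#include <vector>

std::vector<std::thread> workers;
for (size_t t = 0; t < 2; ++t)
{
    workers.emplace_back([&, t]()
    {
        // One WorkingMemHandle per thread; handles are never shared between threads.
        auto handle = loadedNetwork->CreateWorkingMemHandle(networkId);
        armnn::Status status = loadedNetwork->Execute(inputs[t], outputs[t], *handle);
        // ... check status ...
    });
}
for (auto& worker : workers)
{
    worker.join();
}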

1259 {
1260  Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();
1261  std::unordered_map<LayerGuid, std::vector<std::unique_ptr<ITensorHandle> > > tensorHandleMap;
1262  std::vector<WorkingMemDescriptor> workingMemDescriptors;
1263  std::unordered_map<LayerGuid, WorkingMemDescriptor> workingMemDescriptorMap;
1264  TensorHandleFactoryRegistry tensorHandleFactoryRegistry;
1265  WorkloadFactoryMap workloadFactoryMap;
1266 
1267  std::vector<std::shared_ptr<IMemoryManager>> memoryManagers;
1268 
1269  for (auto const& backend : m_Backends)
1270  {
1271  if (backend.second->SupportsTensorAllocatorAPI())
1272  {
1273  backend.second->RegisterTensorHandleFactories(
1274  tensorHandleFactoryRegistry,
1275  static_cast<MemorySourceFlags>(m_NetworkProperties.m_InputSource),
1276  static_cast<MemorySourceFlags>(m_NetworkProperties.m_OutputSource));
1277  memoryManagers.emplace_back(tensorHandleFactoryRegistry.GetMemoryManagers().back());
1278  }
1279  else
1280  {
1281  std::shared_ptr<IMemoryManager> memoryManager = backend.second->CreateMemoryManager();
1282  auto workloadFactory = backend.second->CreateWorkloadFactory(
1283  memoryManager, m_OptimizedNetwork->pOptimizedNetworkImpl->GetModelOptions());
1284 
1285  workloadFactoryMap.emplace(
1286  std::make_pair(backend.first, std::make_pair(std::move(workloadFactory), memoryManager)));
1287  memoryManagers.emplace_back(memoryManager);
1288  }
1289  }
1290 
1291  auto GetTensorHandle = [&](Layer* layer, const OutputSlot& outputSlot, bool isMemoryManaged)
1292  {
1293  ITensorHandleFactory::FactoryId factoryId = outputSlot.GetTensorHandleFactoryId();
1294  const TensorInfo& tensorInfo = outputSlot.GetTensorInfo();
1295 
1296  if (factoryId == ITensorHandleFactory::LegacyFactoryId)
1297  {
1298  BackendId id = layer->GetBackendId();
1299  ARMNN_NO_DEPRECATE_WARN_BEGIN
1300  return workloadFactoryMap.at(id).first->CreateTensorHandle(tensorInfo, isMemoryManaged);
1301  ARMNN_NO_DEPRECATE_WARN_END
1302  }
1303  else
1304  {
1305  ITensorHandleFactory* handleFactory = tensorHandleFactoryRegistry.GetFactory(factoryId);
1306  ARMNN_ASSERT(handleFactory);
1307  return handleFactory->CreateTensorHandle(tensorInfo, isMemoryManaged);
1308  }
1309  };
1310 
1311  std::unordered_map<const ITensorHandle*, unsigned int> handleReferenceCounts;
1312  for (auto&& layer : order)
1313  {
1314  WorkingMemDescriptor workingMemDescriptor;
1315 
1316  // Constant layers execution and management is handled during loaded network construction
1317  if (layer->GetType() == LayerType::Constant)
1318  {
1319  continue;
1320  }
1321  bool isMemoryManaged = true;
1322  bool isInputLayer = true;
1323  // Look for the layer with 1 OutputSlot which has 1 connection and that connection is an Output Layer
1324  // If Export is enabled disable memory management so we can export, otherwise we do a copy
1325  if ((layer->GetNumOutputSlots() == 1) &&
1326  (layer->GetOutputSlots()[0].GetNumConnections() == 1) &&
1327  (layer->GetOutputSlots()[0].GetConnection(0)->GetOwningLayer().GetType() == LayerType::Output))
1328  {
1329  isMemoryManaged = !m_NetworkProperties.m_ExportEnabled;
1330  }
1331  else if (layer->GetType() == LayerType::Input || layer->GetType() == LayerType::MemImport)
1332  {
1333  // Input layers/workloads will not be executed so the descriptor is not added to workingMemDescriptors
1334  // However we will still need to manage the tensorHandle
1335  isInputLayer = false;
1336  isMemoryManaged = !m_NetworkProperties.m_ExportEnabled;
1337  }
1338 
1339  // Create a tensor handle for each output slot of a layer
1340  // Once we create it, we start managing its lifetime
1341  for (auto& slot : layer->GetOutputSlots())
1342  {
1343  tensorHandleMap[layer->GetGuid()].emplace_back(GetTensorHandle(layer, slot, isMemoryManaged));
1344  ITensorHandle* tensorHandle = tensorHandleMap[layer->GetGuid()].back().get();
1345 
1346  workingMemDescriptor.m_Outputs.push_back(tensorHandle);
1347  tensorHandle->Manage();
1348  unsigned int numConnections = slot.GetNumConnections();
1349  ARMNN_ASSERT(numConnections != 0);
1350 
1351  handleReferenceCounts[tensorHandle] = numConnections;
1352  }
1353  // Loop through the input slots in the same layer and decrement the reference counter associated
1354  // to each tensor handle we encounter.
1355  // Once it reaches zero, the lifetime of the tensor handle has ended, and we mark its memory as available
1356  // so that the next tensor handle with a non-overlapping lifetime can share its memory.
1357  for (auto& slot : layer->GetInputSlots())
1358  {
1359  ARMNN_ASSERT(slot.GetConnection());
1360  auto outputSlot = slot.GetConnectedOutputSlot();
1361  auto key = outputSlot->GetOwningLayer().GetGuid();
1362 
1363  // Constant layers execution and management is handled during loaded network construction
1364  auto found = m_ConstantTensorHandles.find(key);
1365  if (found != m_ConstantTensorHandles.end())
1366  {
1367  workingMemDescriptor.m_Inputs.push_back(found->second);
1368  continue;
1369  }
1370 
1371  auto search = tensorHandleMap.find(key);
1372  unsigned int index = outputSlot->CalculateIndexOnOwner();
1373  ITensorHandle* inputTensorHandle = search->second[index].get();
1374  workingMemDescriptor.m_Inputs.push_back(inputTensorHandle);
1375  --handleReferenceCounts.at(inputTensorHandle);
1376  if (handleReferenceCounts.at(inputTensorHandle) == 0u)
1377  {
1378  // Stop managing lifetime of tensor handle
1379  inputTensorHandle->Allocate();
1380  handleReferenceCounts.erase(inputTensorHandle);
1381  }
1382  }
1383  workingMemDescriptorMap.insert({layer->GetGuid(), workingMemDescriptor});
1384 
1385  // Input layers/workloads will not be executed, so the descriptor is not added to workingMemDescriptors
1386  // However we will still need to manage the tensorHandle
1387  if (isInputLayer)
1388  {
1389  workingMemDescriptors.push_back(workingMemDescriptor);
1390  }
1391  }
1392 
1393  return std::make_unique<WorkingMemHandle>(networkId,
1394  workingMemDescriptors,
1395  workingMemDescriptorMap,
1396  memoryManagers,
1397  std::move(tensorHandleMap));
1398 }

◆ EnqueueWorkload()

Status EnqueueWorkload ( const InputTensors & inputTensors,
const OutputTensors & outputTensors 
)

Single thread execution of the loaded network.

Definition at line 535 of file LoadedNetwork.cpp.

References ARMNN_ASSERT_MSG, ARMNN_LOG, LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS, ARMNN_SCOPED_HEAP_PROFILING, ARMNN_SCOPED_PROFILING_EVENT, armnn::CheckFlag(), LabelsAndEventClasses::EXECUTION_OF_GUID, armnn::Failure, ITensorHandle::GetImportFlags(), Graph::GetInputLayers(), Layer::GetInputSlots(), Graph::GetNumInputs(), Layer::GetNumInputSlots(), Graph::GetNumLayers(), Graph::GetNumOutputs(), Layer::GetNumOutputSlots(), Layer::GetOutputHandler(), Graph::GetOutputLayers(), TimelineUtilityMethods::GetTimelineUtils(), Layer::GetType(), armnn::IgnoreUnused(), ITensorHandle::Import(), LabelsAndEventClasses::INFERENCE_GUID, armnn::info, armnn::Input, QueueDescriptor::m_Inputs, WorkloadInfo::m_InputTensorInfos, QueueDescriptor::m_Outputs, WorkloadInfo::m_OutputTensorInfos, ITensorHandle::Map(), armnn::Output, armnn::Success, armnn::Undefined, ITensorHandle::Unmap(), and armnn::warning.

Referenced by RuntimeImpl::EnqueueWorkload().
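
A hedged usage sketch. InputTensors and OutputTensors are the vectors of {LayerBindingId, ConstTensor/Tensor} pairs from armnn/Tensor.hpp; the binding id 0, the float buffers and the loadedNetwork pointer are assumptions for illustration only.

#include <vector>

std::vector<float> inputData(loadedNetwork->GetInputTensorInfo(0).GetNumElements());
std::vector<float> outputData(loadedNetwork->GetOutputTensorInfo(0).GetNumElements());

armnn::InputTensors inputTensors
{
    { 0, armnn::ConstTensor(loadedNetwork->GetInputTensorInfo(0), inputData.data()) }
};
armnn::OutputTensors outputTensors
{
    { 0, armnn::Tensor(loadedNetwork->GetOutputTensorInfo(0), outputData.data()) }
};

// Synchronous, single-threaded execution of the whole workload queue.
armnn::Status status = loadedNetwork->EnqueueWorkload(inputTensors, outputTensors);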

537 {
538  const Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();
539 
540  // Walk graph to determine the order of execution.
541  if (graph.GetNumLayers() < 2)
542  {
543  ARMNN_LOG(warning) << "IRuntime::EnqueueWorkload()::Less than two nodes in graph";
544  return Status::Failure;
545  }
546 
547  // Data that must be kept alive for the entire execution of the workload.
548  WorkloadData workloadData(inputTensors, outputTensors);
549 
550  if (graph.GetNumInputs() != inputTensors.size())
551  {
552  throw InvalidArgumentException("Number of inputs provided does not match network.");
553  }
554 
555  // For each input to the network, call EnqueueInput with the data passed by the user.
556  {
557  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareInputs");
558  m_InputQueue.clear();
559  m_InputQueue.reserve(graph.GetNumInputs());
560  for (const BindableLayer* inputLayer : graph.GetInputLayers())
561  {
562  const TensorPin& pin = workloadData.GetInputTensorPin(inputLayer->GetBindingId());
563  EnqueueInput(*inputLayer, pin.GetTensorHandle(), pin.GetTensorInfo());
564  }
565  }
566 
567  // For each output to the network, call EnqueueOutput with the data passed by the user.
568  {
569  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareOutputs");
570  m_OutputQueue.clear();
571  m_OutputQueue.reserve(graph.GetNumOutputs());
572  for (const BindableLayer* outputLayer : graph.GetOutputLayers())
573  {
574  const TensorPin& pin = workloadData.GetOutputTensorPin(outputLayer->GetBindingId());
575  EnqueueOutput(*outputLayer, pin.GetTensorHandle(), pin.GetTensorInfo());
576  }
577  }
578 
579  std::unique_ptr<TimelineUtilityMethods> timelineUtils =
580  TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
581  ProfilingGuid inferenceGuid = m_ProfilingService.GetNextGuid();
582  if (timelineUtils)
583  {
584  // Add inference timeline trace if profiling is enabled.
585  ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
586  timelineUtils->CreateTypedEntity(inferenceGuid, LabelsAndEventClasses::INFERENCE_GUID);
587  timelineUtils->CreateRelationship(ProfilingRelationshipType::RetentionLink,
588  networkGuid,
589  inferenceGuid,
590  LabelsAndEventClasses::EXECUTION_OF_GUID);
591  timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS);
592  }
593 
594  bool executionSucceeded = true;
595 
596  {
597  if (m_ProfilingService.IsProfilingEnabled())
598  {
599  m_ProfilingService.IncrementCounterValue(armnn::profiling::INFERENCES_RUN);
600  }
601  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "Execute");
602  ARMNN_SCOPED_HEAP_PROFILING("Executing");
603  executionSucceeded = Execute(timelineUtils, inferenceGuid);
604  }
605 
606  if (timelineUtils)
607  {
608  // Add end of life of the inference timeline if profiling is enabled.
609  timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS);
610  timelineUtils->Commit();
611  }
612  return executionSucceeded ? Status::Success : Status::Failure;
613 }

◆ Execute()

Status Execute ( const InputTensors & inputTensors,
const OutputTensors & outputTensors,
IWorkingMemHandle & workingMemHandle 
)

Thread safe execution of the loaded network.

Definition at line 1154 of file LoadedNetwork.cpp.

References WorkingMemHandle::Allocate(), ARMNN_LOG, LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS, ARMNN_SCOPED_PROFILING_EVENT, armnn::error, LabelsAndEventClasses::EXECUTION_OF_GUID, armnn::Failure, Graph::GetInputLayers(), armnn::GetInputTensor(), WorkingMemHandle::GetMutex(), Graph::GetNumInputs(), Graph::GetNumLayers(), Graph::GetOutputLayers(), armnn::GetOutputTensor(), TimelineUtilityMethods::GetTimelineUtils(), WorkingMemHandle::GetWorkingMemDescriptorAt(), LabelsAndEventClasses::INFERENCE_GUID, WorkingMemHandle::IsAllocated(), armnn::profiling::RetentionLink, armnn::Success, armnn::Undefined, and armnn::warning.

Referenced by RuntimeImpl::Execute(), and LoadedNetwork::FreeWorkingMemory().
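
A minimal sketch of a single call, assuming inputTensors, outputTensors and networkId already exist. As the listing below shows, the handle's mutex is taken and its working memory is allocated on first use, so the same handle can be reused for successive calls on one thread.

// Create the handle once and reuse it for every Execute() call on this thread.
auto workingMemHandle = loadedNetwork->CreateWorkingMemHandle(networkId);
armnn::Status status = loadedNetwork->Execute(inputTensors, outputTensors, *workingMemHandle);
if (status != armnn::Status::Success)
{
    // Failing workloads are reported through ARMNN_LOG(error); see the Fail lambda below.
}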

1157 {
1158  const Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();
1159 
1160  // Walk graph to determine the order of execution.
1161  if (graph.GetNumLayers() < 2)
1162  {
1163  ARMNN_LOG(warning) << "IRuntime::EnqueueWorkload()::Less than two nodes in graph";
1164  return Status::Failure;
1165  }
1166 
1167  if (graph.GetNumInputs() != inputTensors.size())
1168  {
1169  throw InvalidArgumentException("Number of inputs provided does not match network.");
1170  }
1171 
1172  std::unique_ptr<profiling::TimelineUtilityMethods> timelineUtils =
1173  profiling::TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
1174  profiling::ProfilingGuid inferenceGuid = m_ProfilingService.GetNextGuid();
1175  if (timelineUtils)
1176  {
1177  // Add inference timeline trace if profiling is enabled.
1178  profiling::ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
1179  timelineUtils->CreateTypedEntity(inferenceGuid, profiling::LabelsAndEventClasses::INFERENCE_GUID);
1180  timelineUtils->CreateRelationship(profiling::ProfilingRelationshipType::RetentionLink,
1181  networkGuid,
1182  inferenceGuid,
1183  profiling::LabelsAndEventClasses::EXECUTION_OF_GUID);
1184  timelineUtils->RecordEvent(inferenceGuid, profiling::LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS);
1185  }
1186 
1187  bool executionSucceeded = true;
1188 
1189  if (timelineUtils)
1190  {
1191  // Add end of life of the inference timeline if profiling is enabled.
1192  timelineUtils->RecordEvent(inferenceGuid, profiling::LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS);
1193  timelineUtils->Commit();
1194  }
1195  WorkingMemHandle& workingMemHandle = dynamic_cast<WorkingMemHandle&>(iWorkingMemHandle);
1196  std::lock_guard<std::mutex> lockGuard(workingMemHandle.GetMutex());
1197 
1198  if (!workingMemHandle.IsAllocated())
1199  {
1200  workingMemHandle.Allocate();
1201  }
1202 
1203  {
1204  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareInputs");
1205  for (const BindableLayer* inputLayer : graph.GetInputLayers())
1206  {
1207  EnqueueInput(*inputLayer, GetInputTensor(inputLayer->GetBindingId(), inputTensors), workingMemHandle);
1208  }
1209  }
1210 
1211  auto Fail = [&](const std::exception& error)
1212  {
1213  ARMNN_LOG(error) << "An error occurred attempting to execute a workload: " << error.what();
1214  executionSucceeded = false;
1215  };
1216  profiling::ProfilingDynamicGuid workloadInferenceID(0);
1217 
1218  try
1219  {
1220  for (unsigned int i = 0; i < m_WorkloadQueue.size(); ++i)
1221  {
1222  auto& workload = m_WorkloadQueue[i];
1223  if (timelineUtils)
1224  {
1225  workloadInferenceID = timelineUtils->RecordWorkloadInferenceAndStartOfLifeEvent(workload->GetGuid(),
1226  inferenceGuid);
1227  }
1228  workload->ExecuteAsync(workingMemHandle.GetWorkingMemDescriptorAt(i));
1229 
1230  if (timelineUtils)
1231  {
1232  timelineUtils->RecordEndOfLifeEvent(workloadInferenceID);
1233  }
1234  }
1235  }
1236  catch (const RuntimeException& error)
1237  {
1238  Fail(error);
1239  }
1240  catch (const std::runtime_error& error)
1241  {
1242  Fail(error);
1243  }
1244  // For each output to the network, call EnqueueOutput with the data passed by the user.
1245  {
1246  ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareOutputs");
1247  for (const BindableLayer *outputLayer : graph.GetOutputLayers())
1248  {
1249  EnqueueOutput(*outputLayer, GetOutputTensor(outputLayer->GetBindingId(), outputTensors), workingMemHandle);
1250  }
1251  }
1252 
1253  return executionSucceeded ? Status::Success : Status::Failure;
1254 }

◆ FreeWorkingMemory()

void FreeWorkingMemory ( )

Definition at line 791 of file LoadedNetwork.cpp.

References ARMNN_LOG, armnn::error, and LoadedNetwork::Execute().

Referenced by RuntimeImpl::CreateWorkingMemHandle(), and RuntimeImpl::EnqueueWorkload().

792 {
793  std::lock_guard<std::mutex> lockGuard(m_WorkingMemMutex);
794  if (!m_IsWorkingMemAllocated)
795  {
796  return;
797  }
798  // Informs the memory managers to release memory in their respective memory groups
799  for (auto&& workloadFactory : m_WorkloadFactories)
800  {
801  IBackendInternal::IMemoryManagerSharedPtr memoryManager = workloadFactory.second.second;
802  if (memoryManager)
803  {
804  memoryManager->Release();
805  }
806  }
807  m_TensorHandleFactoryRegistry.ReleaseMemory();
808  m_IsWorkingMemAllocated = false;
809 }

◆ GetInputTensorInfo()

TensorInfo GetInputTensorInfo ( LayerBindingId  layerId) const

Definition at line 386 of file LoadedNetwork.cpp.

References ARMNN_ASSERT_MSG.

Referenced by RuntimeImpl::GetInputTensorInfo().
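
A short sketch of the typical use of the returned TensorInfo, sizing a host buffer for a bound input. The binding id 0 and the loadedNetwork pointer are assumptions.

#include <cstdint>
#include <vector>

armnn::TensorInfo inputInfo = loadedNetwork->GetInputTensorInfo(0);
// GetNumBytes() accounts for the data type, so this works for any input precision.
std::vector<uint8_t> inputBuffer(inputInfo.GetNumBytes());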

387 {
388  for (auto&& inputLayer : m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetInputLayers())
389  {
390  ARMNN_ASSERT_MSG(inputLayer->GetNumOutputSlots() == 1, "Input layer should have exactly 1 output slot");
391  if (inputLayer->GetBindingId() == layerId)
392  {
393  return inputLayer->GetOutputSlot(0).GetTensorInfo();
394  }
395  }
396 
397  throw InvalidArgumentException(fmt::format("No input layer is associated with id {}", layerId));
398 }

◆ GetNetworkGuid()

profiling::ProfilingGuid GetNetworkGuid ( )

Definition at line 381 of file LoadedNetwork.cpp.

382 {
383  return m_OptimizedNetwork->GetGuid();
384 }

◆ GetOutputTensorInfo()

TensorInfo GetOutputTensorInfo ( LayerBindingId  layerId) const

Definition at line 400 of file LoadedNetwork.cpp.

References ARMNN_ASSERT_MSG, CHECK_LOCATION, BackendId::Get(), Layer::GetBackendId(), Layer::GetNameStr(), armnn::IgnoreUnused(), armnn::info, and IWorkloadFactory::IsLayerSupported().

Referenced by RuntimeImpl::GetOutputTensorInfo().

401 {
402  for (auto&& outputLayer : m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetOutputLayers())
403  {
404  ARMNN_ASSERT_MSG(outputLayer->GetNumInputSlots() == 1, "Output layer should have exactly 1 input slot");
405  ARMNN_ASSERT_MSG(outputLayer->GetInputSlot(0).GetConnection(), "Input slot on Output layer must be connected");
406  if (outputLayer->GetBindingId() == layerId)
407  {
408  return outputLayer->GetInputSlot(0).GetConnection()->GetTensorInfo();
409  }
410  }
411 
412  throw InvalidArgumentException(fmt::format("No output layer is associated with id {}", layerId));
413 }

◆ GetProfiler()

const std::shared_ptr<IProfiler>& GetProfiler ( ) const
inline

◆ IsAsyncEnabled()

bool IsAsyncEnabled ( )
inline

Definition at line 90 of file LoadedNetwork.hpp.

Referenced by RuntimeImpl::CreateWorkingMemHandle(), RuntimeImpl::EnqueueWorkload(), RuntimeImpl::Execute(), and RuntimeImpl::Schedule().

91  {
92  return m_NetworkProperties.m_AsyncEnabled;
93  }

◆ MakeLoadedNetwork()

std::unique_ptr< LoadedNetwork > MakeLoadedNetwork ( std::unique_ptr< IOptimizedNetwork > net,
std::string &  errorMessage,
const INetworkProperties & networkProperties,
profiling::ProfilingService & profilingService,
const NetworkId  networkIdOut 
)
static

Definition at line 85 of file LoadedNetwork.cpp.

References ITensorHandle::Allocate(), ARMNN_ASSERT, ARMNN_LOG, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS, armnn::BackendRegistryInstance(), armnn::Constant, IBackendInternal::CreateMemoryManager(), IBackendInternal::CreateWorkloadFactory(), armnn::error, armnnUtils::Processes::GetCurrentId(), BackendRegistry::GetFactory(), ProfilerManager::GetInstance(), TimelineUtilityMethods::GetTimelineUtils(), armnn::Input, ITensorHandleFactory::LegacyFactoryId, INetworkProperties::m_AsyncEnabled, WorkingMemDescriptor::m_Outputs, armnn::MemImport, LabelsAndEventClasses::NETWORK_GUID, armnn::Output, LabelsAndEventClasses::PROCESS_ID_GUID, ProfilerManager::RegisterProfiler(), IBackendInternal::SupportsTensorAllocatorAPI(), and Graph::TopologicalSort().

Referenced by RuntimeImpl::LoadNetwork().
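
A hedged sketch of the factory call as the runtime drives it; the optimized network, network properties, profiling service and network id are assumptions owned by the caller. On failure the function returns an empty pointer and fills errorMessage, as the listing below shows.

std::string errorMessage;
std::unique_ptr<armnn::LoadedNetwork> loadedNetwork =
    armnn::LoadedNetwork::MakeLoadedNetwork(std::move(optimizedNet),
                                            errorMessage,
                                            networkProperties,
                                            profilingService,
                                            networkId);
if (!loadedNetwork)
{
    ARMNN_LOG(error) << "LoadNetwork failed: " << errorMessage;
}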

90 {
91  std::unique_ptr<LoadedNetwork> loadedNetwork;
92 
93  auto Fail = [&](const std::exception& error) -> std::unique_ptr<LoadedNetwork>
94  {
95  errorMessage = ToErrorMessage("An error occurred when preparing the network workloads: ", error);
96  ARMNN_LOG(error) << errorMessage;
97 
98  return std::unique_ptr<LoadedNetwork>();
99  };
100 
101  try
102  {
103  loadedNetwork.reset(new LoadedNetwork(std::move(net), networkProperties, profilingService, networkIdOut));
104  }
105  catch (const armnn::RuntimeException& error)
106  {
107  return Fail(error);
108  }
109  catch (const armnn::Exception& error)
110  {
111  return Fail(error);
112  }
113  catch (const std::runtime_error& error)
114  {
115  return Fail(error);
116  }
117 
118  return loadedNetwork;
119 }

◆ RegisterDebugCallback()

void RegisterDebugCallback ( const DebugCallbackFunction & func)

Definition at line 1400 of file LoadedNetwork.cpp.

Referenced by RuntimeImpl::RegisterDebugCallback().
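
A sketch of registering a callback. The three-parameter lambda signature assumed here matches the DebugCallbackFunction alias from armnn/Types.hpp (layer GUID, output slot index, tensor handle); loadedNetwork is an assumption.

#include <iostream>

loadedNetwork->RegisterDebugCallback(
    [](armnn::LayerGuid guid, unsigned int slotIndex, armnn::ITensorHandle* tensorHandle)
    {
        armnn::IgnoreUnused(guid);
        std::cout << "Debug output: slot " << slotIndex << " holds "
                  << tensorHandle->GetShape().GetNumElements() << " elements" << std::endl;
    });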

1401 {
1402  for (auto&& workloadPtr: m_WorkloadQueue)
1403  {
1404  workloadPtr.get()->RegisterDebugCallback(func);
1405  }
1406 }

◆ Schedule()

void Schedule ( const InputTensors & inputTensors,
const OutputTensors & outputTensors,
const QosExecPriority  priority,
std::shared_ptr< IAsyncExecutionCallback >  cb 
)

Schedule an asynchronous execution on the loaded network.

Definition at line 892 of file LoadedNetwork.cpp.

References ARMNN_ASSERT_MSG, ARMNN_SCOPED_PROFILING_EVENT, armnn::CheckFlag(), armnn::CopyTensorContentsGeneric(), armnn::EXPIRE_RATE, armnn::Failure, Layer::GetGuid(), ITensorHandle::GetImportFlags(), BaseTensor< MemoryType >::GetInfo(), Layer::GetInputSlots(), BaseTensor< MemoryType >::GetMemoryArea(), Layer::GetNumInputSlots(), armnn::GetTimeNow(), Layer::GetType(), WorkingMemHandle::GetWorkingMemDescriptor(), armnn::High, ITensorHandle::Import(), armnn::Input, armnn::Low, WorkingMemDescriptor::m_Inputs, WorkingMemDescriptor::m_Outputs, ITensorHandle::Map(), armnn::Medium, armnn::Output, armnn::Success, armnn::Undefined, and ITensorHandle::Unmap().

Referenced by RuntimeImpl::Schedule().
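
A hedged sketch of queueing an asynchronous execution. The tensors, the loadedNetwork pointer, the armnn::experimental namespace qualification and the MakeMyCallback() helper are all assumptions; the priority selects between the three internal queues visible in the listing below.

// MakeMyCallback() is a hypothetical application helper returning an IAsyncExecutionCallback.
std::shared_ptr<armnn::experimental::IAsyncExecutionCallback> callback = MakeMyCallback();

// Schedule() returns after queueing; completion is reported through the supplied callback.
loadedNetwork->Schedule(inputTensors,
                        outputTensors,
                        armnn::QosExecPriority::Medium,   // Low, Medium or High
                        callback);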

896 {
897  // Group execution parameters so that they can be easily added to the queue
898  ExecutionTuple groupExecParams = std::make_tuple(inputTensors, outputTensors, cb);
899  std::shared_ptr<ExecutionTuple> operation = make_shared<ExecutionTuple>(groupExecParams);
900 
901  // Add a message to the queue and notify the request thread
902  std::unique_lock<std::mutex> lock(m_ThreadPoolMutex);
903  switch (priority) {
904  case QosExecPriority::High:
905  m_HighPriorityQueue.push(operation);
906  break;
907  case QosExecPriority::Low:
908  m_LowPriorityQueue.push(operation);
909  break;
910  case QosExecPriority::Medium:
911  default:
912  m_MediumPriorityQueue.push(operation);
913  }
914  m_ThreadPoolEvent.notify_one();
915 }

◆ SendNetworkStructure()

void SendNetworkStructure ( )

Definition at line 344 of file LoadedNetwork.cpp.

References TimelineUtilityMethods::GetTimelineUtils(), armnn::Input, LabelsAndEventClasses::NETWORK_GUID, armnn::Output, and Graph::TopologicalSort().

345 {
346  Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();
347  ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
348 
349  std::unique_ptr<TimelineUtilityMethods> timelineUtils =
350  TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
351 
352  timelineUtils->CreateTypedEntity(networkGuid, LabelsAndEventClasses::NETWORK_GUID);
353 
354  for (auto&& layer : order)
355  {
356  // Add layer to the post-optimisation network structure
357  AddLayerStructure(timelineUtils, *layer, networkGuid);
358  switch (layer->GetType())
359  {
360  case LayerType::Input:
361  case LayerType::Output:
362  {
363  // Inputs and outputs are treated in a special way - see EnqueueInput() and EnqueueOutput().
364  break;
365  }
366  default:
367  {
368  for (auto& workload : m_WorkloadQueue)
369  {
370  // Add workload to the post-optimisation network structure
371  AddWorkloadStructure(timelineUtils, workload, *layer);
372  }
373  break;
374  }
375  }
376  }
377  // Commit to send the post-optimisation network structure
378  timelineUtils->Commit();
379 }

The documentation for this class was generated from the following files:

LoadedNetwork.hpp
LoadedNetwork.cpp