diff options
author | Mike Kelly <mike.kelly@arm.com> | 2021-03-29 15:04:50 +0100 |
---|---|---|
committer | mike.kelly <mike.kelly@arm.com> | 2021-03-29 14:03:30 +0000 |
commit | 386ff1a721cdca3689b009ba31f2d3ac8bea2fae (patch) | |
tree | e2f5c26ab2601fd0be8c1223111f55cf1ff94e6e /src/armnn/AsyncNetwork.hpp | |
parent | 23dbe3d3ff51c2b297ce5bf6360da6552f1c3bf5 (diff) | |
download | armnn-386ff1a721cdca3689b009ba31f2d3ac8bea2fae.tar.gz |
IVGCVSW-5790 Merge async prototype
* Added thread safe execution mechanism for armnn
* Removed duplicate function bool Compare(T a, T b, float tolerance)
* Added StridedSliceAsyncEndToEndTest
* Fixed memory leak
Signed-off-by: Mike Kelly <mike.kelly@arm.com>
Change-Id: I2d367fc77ee7c01b8953138543e76af5e691211f
Diffstat (limited to 'src/armnn/AsyncNetwork.hpp')
-rw-r--r-- | src/armnn/AsyncNetwork.hpp | 106 |
1 file changed, 106 insertions, 0 deletions
//
// Copyright © 2021 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#pragma once

#include <armnn/IAsyncNetwork.hpp>
#include <armnn/Tensor.hpp>
#include <armnn/Types.hpp>

#include "LayerFwd.hpp"
#include "Network.hpp"
#include "Profiling.hpp"
#include "WorkingMemHandle.hpp"

#include <armnn/backends/IBackendInternal.hpp>
#include <backendsCommon/TensorHandleFactoryRegistry.hpp>
#include <backendsCommon/Workload.hpp>
#include <backendsCommon/WorkloadFactory.hpp>
#include <ProfilingService.hpp>
#include <TimelineUtilityMethods.hpp>

#include <unordered_map>

namespace armnn
{

namespace experimental
{

/// Concrete implementation of IAsyncNetwork that supports thread-safe execution
/// of an optimized network. Per-call scratch state lives in an IWorkingMemHandle
/// rather than in the network itself, so multiple threads may call Execute()
/// concurrently as long as each uses its own handle (see CreateWorkingMemHandle()).
/// The class is `final`: it is not designed as a base for further derivation.
class AsyncNetwork final : public IAsyncNetwork
{
public:
    /// Ordered collection of workloads making up the executable network.
    using WorkloadQueue = std::vector<std::unique_ptr<IWorkload>>;

    /// Construct from an already-optimized network.
    /// @param net               The optimized network; this object takes ownership.
    /// @param networkProperties Import/export properties for input/output tensors
    ///                          (stored by value in m_NetworkProperties).
    /// @param profilingService  Profiling service instance; held by reference, so it
    ///                          must outlive this AsyncNetwork.
    AsyncNetwork(std::unique_ptr<IOptimizedNetwork> net,
                 const INetworkProperties &networkProperties,
                 profiling::ProfilingService &profilingService);

    /// Releases working memory on destruction (RAII cleanup of FreeWorkingMemory()).
    ~AsyncNetwork() { FreeWorkingMemory(); }

    /// Look up the TensorInfo for the input bound to the given layer id.
    TensorInfo GetInputTensorInfo(LayerBindingId layerId) const override;
    /// Look up the TensorInfo for the output bound to the given layer id.
    TensorInfo GetOutputTensorInfo(LayerBindingId layerId) const override;

    /// Thread safe execution of the network. Returns once execution is complete.
    /// Will block until this and any other thread using the same workingMem object completes.
    virtual Status Execute(const InputTensors& inputTensors,
                           const OutputTensors& outputTensors,
                           IWorkingMemHandle& workingMemHandle) override;

    /// Create a new unique WorkingMemHandle object. Create multiple handles if you wish to have
    /// overlapped Execution by calling this function from different threads.
    std::unique_ptr<IWorkingMemHandle> CreateWorkingMemHandle() override;

    /// Get the profiler used for this network
    std::shared_ptr<IProfiler> GetProfiler() const override;

    /// Register a debug callback function to be used with this network
    void RegisterDebugCallback(const DebugCallbackFunction& func) override;

private:
    /// Releases any working memory held by the network; called from the destructor.
    void FreeWorkingMemory();

    /// Gather the input tensor handles for @p layer into @p inputs, using
    /// @p tensorHandles as a per-layer (keyed by LayerGuid) handle cache.
    /// @param isMemoryManaged Whether the handles use backend-managed memory
    ///        (defaults to false; exact semantics defined in the .cpp).
    void CollectInputTensorHandles(std::unordered_map<LayerGuid, std::vector<ITensorHandle*> >& tensorHandles,
                                   std::vector<ITensorHandle*>& inputs,
                                   const armnn::Layer* layer,
                                   const TensorHandleFactoryRegistry& registry,
                                   const bool isMemoryManaged = false);

    /// Create the output tensor handles for @p layer into @p outputs, recording
    /// them in @p tensorHandles (keyed by LayerGuid) for later lookup.
    void CreateOutputTensorHandles(std::unordered_map<LayerGuid, std::vector<ITensorHandle*> >& tensorHandles,
                                   std::vector<ITensorHandle*>& outputs,
                                   const armnn::Layer* layer,
                                   const TensorHandleFactoryRegistry& registry,
                                   const bool isMemoryManaged = false);

    /// Copy/import @p inputTensor into the working memory for the bound input layer.
    void EnqueueInput(const BindableLayer& layer, const ConstTensor& inputTensor, WorkingMemHandle& handle);

    /// Copy/export the result for the bound output layer into @p outputTensor.
    void EnqueueOutput(const BindableLayer& layer, const Tensor& outputTensor, WorkingMemHandle& handle);

    /// Owning map from backend id to the backend instance.
    using BackendPtrMap = std::unordered_map<BackendId, IBackendInternalUniquePtr>;

    /// A workload factory paired with the memory manager it shares with its backend.
    using WorkloadFactoryWithMemoryManager =
        std::pair<IBackendInternal::IWorkloadFactoryPtr, IBackendInternal::IMemoryManagerSharedPtr>;

    using WorkloadFactoryMap = std::unordered_map<BackendId, WorkloadFactoryWithMemoryManager>;

    /// Resolve the workload factory for the backend that @p layer is assigned to.
    const IWorkloadFactory& GetWorkloadFactory(const Layer& layer) const;

    BackendPtrMap m_Backends;                  ///< Backends in use, keyed by BackendId.
    WorkloadFactoryMap m_WorkloadFactories;    ///< Factory + memory manager per backend.

    std::unique_ptr<IOptimizedNetwork> m_OptimizedNetwork; ///< Owned optimized graph.
    INetworkProperties m_NetworkProperties;                ///< Copied at construction.
    WorkloadQueue m_WorkloadQueue;                         ///< Workloads in execution order.
    std::shared_ptr<IProfiler> m_Profiler;                 ///< Shared with GetProfiler() callers.

    TensorHandleFactoryRegistry m_TensorHandleFactoryRegistry;

    /// Profiling Service Instance (non-owning reference; must outlive this object).
    profiling::ProfilingService& m_ProfilingService;
};

} // namespace experimental

} // namespace armnn