//
// ArmNN 20.08: Network.cpp
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "Network.hpp"
#include "Graph.hpp"
#include "Layer.hpp"
#include "DeviceSpec.hpp"
#include "Optimizer.hpp"
#include "SubgraphViewSelector.hpp"
#include "BackendSettings.hpp"
#include "optimizations/All.hpp"

#include <backendsCommon/CpuTensorHandle.hpp>
#include <backendsCommon/WorkloadFactory.hpp>
#include <armnn/backends/IBackendInternal.hpp>
#include <backendsCommon/TensorHandleFactoryRegistry.hpp>

#include <armnn/Exceptions.hpp>
#include <armnn/Utils.hpp>
#include <armnn/TypesUtils.hpp>
#include <armnn/BackendRegistry.hpp>
#include <armnn/Logging.hpp>
#include <armnn/utility/Assert.hpp>
#include <armnn/utility/IgnoreUnused.hpp>
#include <armnn/utility/PolymorphicDowncast.hpp>

#include <ProfilingService.hpp>

#include <fcntl.h>
#include <algorithm>
#include <fstream>
#include <limits>
#include <map>
#include <memory>
#include <vector>

#include <boost/format.hpp>
#include <boost/numeric/conversion/converter_policies.hpp>
#include <boost/cast.hpp>
namespace armnn
{

INetwork* INetwork::CreateRaw(NetworkOptions networkOptions)
{
    return new Network(networkOptions);
}

INetworkPtr INetwork::Create(NetworkOptions networkOptions)
{
    return INetworkPtr(CreateRaw(networkOptions), &INetwork::Destroy);
}
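
// Example (illustrative sketch): client code creates networks through the
// factory above; INetworkPtr owns the object and invokes INetwork::Destroy on
// release, so no manual delete is required:
//
//     armnn::INetworkPtr net = armnn::INetwork::Create();
//     armnn::IConnectableLayer* input  = net->AddInputLayer(0);
//     armnn::IConnectableLayer* output = net->AddOutputLayer(0);
//     input->GetOutputSlot(0).Connect(output->GetInputSlot(0));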

void INetwork::Destroy(INetwork* network)
{
    delete PolymorphicDowncast<Network*>(network);
}

void IOptimizedNetwork::Destroy(IOptimizedNetwork* network)
{
    delete PolymorphicDowncast<OptimizedNetwork*>(network);
}

Status OptimizedNetwork::PrintGraph()
{
    m_Graph->Print();
    return Status::Success;
}

Status OptimizedNetwork::SerializeToDot(std::ostream& stream) const
{
    return m_Graph->SerializeToDot(stream);
}

void ReportError(const std::string& errorMessage,
                 Optional<std::vector<std::string>&> errorMessages)
{
    std::stringstream fullErrorMessage;
    fullErrorMessage << "ERROR: " << errorMessage;
    ARMNN_LOG(warning) << fullErrorMessage.str();
    if (errorMessages)
    {
        errorMessages.value().push_back(fullErrorMessage.str());
    }
}

void ReportWarning(const std::string& warningMessage,
                   Optional<std::vector<std::string>&> warningMessages)
{
    std::stringstream fullWarningMessage;
    fullWarningMessage << "WARNING: " << warningMessage;
    ARMNN_LOG(warning) << fullWarningMessage.str();
    if (warningMessages)
    {
        warningMessages.value().push_back(fullWarningMessage.str());
    }
}

OptimizationResult ReturnWithError(OptimizationResult res,
                                   const Layer* layer,
                                   const BackendSettings& backendSettings,
                                   Optional<std::vector<std::string>&> errMessages)
{
    std::stringstream failureMsg;
    failureMsg << "Layer of type " << GetLayerTypeAsCString(layer->GetType())
               << " is not supported on any preferred backend " << backendSettings.m_PreferredBackends;
    ReportError(failureMsg.str(), errMessages);

    res.m_Error = true;
    return res;
}

bool CheckScaleSetOnQuantizedType(Layer* layer, Optional<std::vector<std::string>&> errMessages)
{
    bool noErrors = true;
    unsigned int numOutputs = layer->GetNumOutputSlots();
    for (unsigned int i = 0; i < numOutputs; i++)
    {
        OutputSlot& outputSlot = layer->GetOutputSlot(i);
        TensorInfo info = outputSlot.GetTensorInfo();
        if (DataType::QAsymmU8 == info.GetDataType())
        {
            if (0.f == info.GetQuantizationScale())
            {
                noErrors = false;
                std::stringstream ss;
                ss << "output " << i << " of layer " << GetLayerTypeAsCString(layer->GetType())
                   << " (" << layer->GetNameStr() << ") is of type"
                   << " Quantized 8 bit but its scale parameter has not been set";
                ReportError(ss.str(), errMessages);
            }
            // Softmax under QuantisedAsymm8 must always be scale (1.0f/256.0f) and offset 0
            if ((info.GetQuantizationScale() != (1.0f / 256.0f) ||
                 info.GetQuantizationOffset() != 0) &&
                 layer->GetType() == armnn::LayerType::Softmax)
            {
                std::stringstream ss;
                ss << "Quantization parameters for Softmax layer (Scale: " <<
                   info.GetQuantizationScale() << " and Offset: " << info.GetQuantizationOffset() <<
                   ") are incorrect and have been updated to Scale: 0.00390625 and Offset: 0";
                ARMNN_LOG(warning) << ss.str();
                info.SetQuantizationScale((1.0f / 256.0f));
                info.SetQuantizationOffset(0);
                outputSlot.SetTensorInfo(info);
            }
        }
    }
    return noErrors;
}
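
// Example (illustrative sketch): the check above enforces the QAsymmU8
// constraint for Softmax outputs (scale == 1/256, offset == 0). A client
// satisfies it like this ('softmax' being an IConnectableLayer*):
//
//     armnn::TensorInfo info({ 1, 10 }, armnn::DataType::QAsymmU8);
//     info.SetQuantizationScale(1.0f / 256.0f);
//     info.SetQuantizationOffset(0);
//     softmax->GetOutputSlot(0).SetTensorInfo(info);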

template <typename LayerT>
LayerT* ConvertBf16ToFp32Weight(Layer* l)
{
    LayerT* layer = PolymorphicDowncast<LayerT*>(l);
    if ((layer->GetType() == LayerType::Convolution2d || layer->GetType() == LayerType::FullyConnected)
         && layer->m_Weight)
    {
        const TensorInfo& info = layer->m_Weight->GetTensorInfo();

        if (info.GetDataType() == DataType::BFloat16)
        {
            std::vector<float> newValues(info.GetNumElements());

            armnnUtils::FloatingPointConverter::ConvertBFloat16ToFloat32(
                layer->m_Weight->template GetTensor<armnn::BFloat16>(), info.GetNumElements(), newValues.data());

            TensorInfo newInfo(info.GetShape(), DataType::Float32);
            ConstTensor newInput(newInfo, newValues);
            layer->m_Weight.reset(new ScopedCpuTensorHandle(newInput));
        }
    }
    return layer;
}

OptimizationResult AttemptBackendAssignment(BackendSettings& backendSettings,
                                            Graph& graph,
                                            Layer* layer,
                                            BackendId backend,
                                            DataType dataTypeIn,
                                            DataType dataTypeOut,
                                            const std::vector<BackendId>& availablePreferredBackends,
                                            std::string& reasonIfUnsupported,
                                            Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    // Helper lambda to compose a meaningful error message before returning with error
    auto ReturnError = [&](const Layer* layer)
        {
            return ReturnWithError(result, layer, backendSettings, errMessages);
        };

    // We need to set the compute device on the layer
    // before we can check if it is supported
    layer->SetBackendId(backend);
    if (!IWorkloadFactory::IsLayerSupported(*layer, EmptyOptional(), reasonIfUnsupported))
    {
        if (dataTypeIn == DataType::Float16 || dataTypeOut == DataType::Float16)
        {
            if (IWorkloadFactory::IsLayerSupported(*layer, DataType::Float32, reasonIfUnsupported)
                && layer->GetType() != LayerType::ConvertFp32ToFp16
                && layer->GetType() != LayerType::ConvertFp16ToFp32)
            {
                // Insert FP16 -> FP32 conversion layer before current layer
                std::vector<ConvertFp16ToFp32Layer*> convertFp16ToFp32Layers;
                if (dataTypeIn == DataType::Float16)
                {
                    convertFp16ToFp32Layers =
                        InsertConvertFp16ToFp32LayersBefore(graph, *layer);
                }

                // Insert FP32 -> FP16 conversion layer after current layer
                std::vector<ConvertFp32ToFp16Layer*> convertFp32ToFp16Layers;
                if (dataTypeOut == DataType::Float16)
                {
                    convertFp32ToFp16Layers =
                        InsertConvertFp32ToFp16LayersAfter(graph, *layer);
                }

                // Assign a supported backend to the newly introduced conversion layers
                auto AssignFirstSupportedBackend = [&](Layer* layer, BackendId preferredBackend)
                    {
                        bool supportedBackendFound = false;
                        std::string reasonIfUnsupported;

                        // Try preferred backend first
                        layer->SetBackendId(preferredBackend);
                        if (IWorkloadFactory::IsLayerSupported(*layer,
                                                               EmptyOptional(),
                                                               reasonIfUnsupported))
                        {
                            supportedBackendFound = true;
                        }
                        else
                        {
                            for (const auto& backend : availablePreferredBackends)
                            {
                                // Skip preferred backend (we already determined that it is not supported)
                                if (backend == preferredBackend)
                                {
                                    continue;
                                }

                                layer->SetBackendId(backend);
                                if (IWorkloadFactory::IsLayerSupported(*layer,
                                                                       EmptyOptional(),
                                                                       reasonIfUnsupported))
                                {
                                    supportedBackendFound = true;
                                    break;
                                }
                            }
                        }

                        return supportedBackendFound;
                    };

                for (ConvertFp16ToFp32Layer* convertLayer : convertFp16ToFp32Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                for (ConvertFp32ToFp16Layer* convertLayer : convertFp32ToFp16Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                return result;
            }
        }
        else if (dataTypeIn == DataType::BFloat16 || dataTypeOut == DataType::BFloat16)
        {
            if (IWorkloadFactory::IsLayerSupported(*layer, DataType::Float32, reasonIfUnsupported)
                && layer->GetType() != LayerType::ConvertFp32ToBf16
                && layer->GetType() != LayerType::ConvertBf16ToFp32)
            {
                // Insert BF16 -> FP32 conversion layer before current layer
                std::vector<ConvertBf16ToFp32Layer*> convertBf16ToFp32Layers;
                if (dataTypeIn == DataType::BFloat16)
                {
                    convertBf16ToFp32Layers =
                        InsertConvertBf16ToFp32LayersBefore(graph, *layer);
                    if (layer->GetType() == LayerType::Convolution2d)
                    {
                        ConvertBf16ToFp32Weight<Convolution2dLayer>(layer);
                    }
                    else if (layer->GetType() == LayerType::FullyConnected)
                    {
                        ConvertBf16ToFp32Weight<FullyConnectedLayer>(layer);
                    }
                }

                // Insert FP32 -> BF16 conversion layer after current layer
                std::vector<ConvertFp32ToBf16Layer*> convertFp32ToBf16Layers;
                if (dataTypeOut == DataType::BFloat16)
                {
                    convertFp32ToBf16Layers =
                        InsertConvertFp32ToBf16LayersAfter(graph, *layer);
                }

                // Assign a supported backend to the newly introduced conversion layers
                auto AssignFirstSupportedBackend = [&](Layer* layer, BackendId preferredBackend)
                    {
                        bool supportedBackendFound = false;
                        std::string reasonIfUnsupported;

                        // Try preferred backend first
                        layer->SetBackendId(preferredBackend);
                        if (IWorkloadFactory::IsLayerSupported(*layer,
                                                               EmptyOptional(),
                                                               reasonIfUnsupported))
                        {
                            supportedBackendFound = true;
                        }
                        else
                        {
                            for (const auto& backend : availablePreferredBackends)
                            {
                                // Skip preferred backend (we already determined that it is not supported)
                                if (backend == preferredBackend)
                                {
                                    continue;
                                }

                                layer->SetBackendId(backend);
                                if (IWorkloadFactory::IsLayerSupported(*layer,
                                                                       EmptyOptional(),
                                                                       reasonIfUnsupported))
                                {
                                    supportedBackendFound = true;
                                    break;
                                }
                            }
                        }

                        return supportedBackendFound;
                    };

                for (ConvertBf16ToFp32Layer* convertLayer : convertBf16ToFp32Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                for (ConvertFp32ToBf16Layer* convertLayer : convertFp32ToBf16Layers)
                {
                    if (!AssignFirstSupportedBackend(convertLayer, backend))
                    {
                        return ReturnError(convertLayer);
                    }
                }

                return result;
            }
        }

        std::stringstream warningMsg;
        warningMsg << "Layer of type " << GetLayerTypeAsCString(layer->GetType())
                   << " is not supported on requested backend " << layer->GetBackendId().Get()
                   << " for input data type " << GetDataTypeName(dataTypeIn)
                   << " and output data type " << GetDataTypeName(dataTypeOut)
                   << " (reason: " << reasonIfUnsupported
                   << "), falling back to the next backend.";
        ReportWarning(warningMsg.str(), errMessages);

        return OptimizationResult(true, false);
    }
    else
    {
        return result;
    }
}
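
// Sketch of the graph rewrite performed above when a Float16 layer is only
// supported in Float32 (the BFloat16 branch is analogous):
//
//     before:  ...  --Fp16-->  [Layer]  --Fp16-->  ...
//     after:   ...  --Fp16-->  [ConvertFp16ToFp32]  --Fp32-->  [Layer]
//                   --Fp32-->  [ConvertFp32ToFp16]  --Fp16-->  ...
//
// Each inserted conversion layer is then assigned the first backend that
// supports it, preferring the backend chosen for the original layer.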

OptimizationResult AssignBackends(OptimizedNetwork* optNetObjPtr,
                                  BackendSettings& backendSettings,
                                  Graph::Iterator& firstLayer,
                                  Graph::Iterator& lastLayer,
                                  Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    // Helper lambda to compose a meaningful error message before returning with error
    auto ReturnError = [&](const Layer* layer)
        {
            return ReturnWithError(result, layer, backendSettings, errMessages);
        };

    auto availablePreferredBackends = backendSettings.GetAvailablePreferredBackends();
    if (availablePreferredBackends.empty())
    {
        std::stringstream failureMsg;
        failureMsg << "No preferred backends are available";
        ReportError(failureMsg.str(), errMessages);

        result.m_Error = true;
        return result;
    }

    for (auto it = firstLayer; it != lastLayer; ++it)
    {
        auto layer = *it;

        DataType dataTypeIn  = layer->GetNumInputSlots() == 0 ? DataType::Float32 :
            layer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo().GetDataType();
        DataType dataTypeOut = layer->GetNumOutputSlots() == 0 ? DataType::Float32 :
            layer->GetOutputSlot(0).GetTensorInfo().GetDataType();

        std::string reasonIfUnsupported;
        bool found = false;
        if (!CheckScaleSetOnQuantizedType(layer, errMessages))
        {
            // Don't bomb immediately, find all the quantized outputs
            // which haven't had a scale set and report them all back.
            result.m_Error = true;
        }

        // First try to assign the layer to the backend hinted at, if any
        if (layer->GetBackendHint().has_value() &&
            backendSettings.IsBackendSupported(layer->GetBackendHint().value()) &&
            AttemptBackendAssignment(backendSettings,
                                     optNetObjPtr->GetGraph(),
                                     layer,
                                     layer->GetBackendHint().value(),
                                     dataTypeIn,
                                     dataTypeOut,
                                     availablePreferredBackends,
                                     reasonIfUnsupported,
                                     errMessages).IsOk())
        {
            found = true;
            backendSettings.m_SelectedBackends.insert(layer->GetBackendHint().value());
        }
        else
        {
            // Try to assign the layer to the preferred list of backends
            for (const auto& backend : availablePreferredBackends)
            {
                if (layer->GetBackendHint().has_value() &&
                    layer->GetBackendHint().value() == backend)
                {
                    continue; // Don't re-test the backend hint
                }

                OptimizationResult res = AttemptBackendAssignment(backendSettings,
                                                                  optNetObjPtr->GetGraph(),
                                                                  layer,
                                                                  backend,
                                                                  dataTypeIn,
                                                                  dataTypeOut,
                                                                  availablePreferredBackends,
                                                                  reasonIfUnsupported,
                                                                  errMessages);

                if (res.IsOk())
                {
                    found = true;
                    backendSettings.m_SelectedBackends.insert(backend);
                    break;
                }
                else if (res.IsError())
                {
                    return res; // Cannot continue.
                    // Note: we don't need to log the error as it would already
                    // be logged in AttemptBackendAssignment().
                }
                else
                {
                    ARMNN_ASSERT_MSG(res.IsWarningOnly(), "OptimizationResult in unexpected state.");
                }
            }
        }

        // If the layer is unsupported by any devices, log and return a null network.
        if (!found)
        {
            // NOTE: if the layer is not an operation queue type AND we have not got CpuRef as a
            // fallback we should set the compute device on the layer to CpuRef (these are not
            // available as accelerated operations, or are only available under certain
            // conditions, currently they comprise MemCopy, Constant, Permute)
            armnn::LayerType layerType = layer->GetType();
            if (!backendSettings.IsCpuRefUsed() && (layerType == armnn::LayerType::MemCopy ||
                                                    layerType == armnn::LayerType::Constant ||
                                                    layerType == armnn::LayerType::Permute))
            {
                BackendId cpuBackendId(armnn::Compute::CpuRef);
                layer->SetBackendId(cpuBackendId);
                backendSettings.m_SelectedBackends.insert(cpuBackendId);
            }
            else
            {
                return ReturnError(layer);
            }
        }
    }

    return result;
}

OptimizationResult AssignBackends(OptimizedNetwork* optNetObjPtr,
                                  BackendSettings& backendSettings,
                                  SubgraphView& subgraph,
                                  Optional<std::vector<std::string>&> errMessages)
{
    Graph::Iterator firstLayer = subgraph.begin();
    Graph::Iterator lastLayer  = subgraph.end();
    return AssignBackends(optNetObjPtr,
                          backendSettings,
                          firstLayer,
                          lastLayer,
                          errMessages);
}

BackendsMap CreateSupportedBackends(TensorHandleFactoryRegistry& handleFactoryRegistry,
                                    BackendSettings& backendSettings)
{
    BackendsMap backends;
    auto const& backendRegistry = BackendRegistryInstance();
    for (auto&& selectedBackend : backendSettings.m_SupportedBackends)
    {
        auto backendFactory = backendRegistry.GetFactory(selectedBackend);
        auto backendObjPtr = backendFactory();
        ARMNN_ASSERT(backendObjPtr);

        backendObjPtr->RegisterTensorHandleFactories(handleFactoryRegistry);

        backends[backendObjPtr->GetId()] = std::move(backendObjPtr);
    }

    return backends;
}
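
// Example (illustrative sketch): the same registry can be queried directly,
// e.g. to check for and construct a specific backend; "CpuAcc" is used here
// purely as a placeholder id:
//
//     auto& registry = armnn::BackendRegistryInstance();
//     if (registry.IsBackendRegistered("CpuAcc"))
//     {
//         auto factory = registry.GetFactory("CpuAcc");
//         armnn::IBackendInternalUniquePtr backend = factory();
//     }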

OptimizationResult ApplyBackendOptimizations(OptimizedNetwork* optNetObjPtr,
                                             BackendSettings& backendSettings,
                                             BackendsMap& backends,
                                             Optional<std::vector<std::string>&> errMessages)
{
    ARMNN_ASSERT(optNetObjPtr);

    OptimizationResult result;

    // Get the optimized graph
    Graph& optGraph = optNetObjPtr->GetGraph();

    // Run backend specific optimizations
    for (auto&& selectedBackend : backendSettings.m_SelectedBackends)
    {
        auto backendObjPtr = backends.find(selectedBackend)->second.get();
        ARMNN_ASSERT(backendObjPtr);

        // Select sub-graphs based on backend
        SubgraphViewSelector::Subgraphs subgraphs =
            SubgraphViewSelector::SelectSubgraphs(optGraph,
                                                  // Select layers assigned to the requested backend
                                                  [&backendObjPtr](const Layer& layer)
                                                  {
                                                      return layer.GetType() != LayerType::Input &&
                                                             layer.GetType() != LayerType::Output &&
                                                             layer.GetBackendId() == backendObjPtr->GetId();
                                                  });
        if (subgraphs.empty())
        {
            // No sub-graphs found, try with next selected backend
            continue;
        }

        // Try to optimize each sub-graph
        for (auto& subgraph : subgraphs)
        {
            // Try to optimize the current sub-graph
            OptimizationViews optimizationViews = backendObjPtr->OptimizeSubgraphView(*subgraph);
            ARMNN_ASSERT(optimizationViews.Validate(*subgraph));

            // Optimization attempted, check the resulting optimized sub-graph
            for (auto& substitution : optimizationViews.GetSubstitutions())
            {
                // Sub-graph optimized, substitute the sub-graph with the new optimized one in the main optimized graph
                SubgraphView& replacementSubgraph   = substitution.m_ReplacementSubgraph;
                SubgraphView& substitutableSubgraph = substitution.m_SubstitutableSubgraph;
                optGraph.SubstituteSubgraph(substitutableSubgraph, replacementSubgraph);

                // Assign the current backend to the optimized sub-graph
                std::for_each(replacementSubgraph.begin(), replacementSubgraph.end(), [&selectedBackend](Layer* l)
                    {
                        ARMNN_ASSERT(l);
                        l->SetBackendId(selectedBackend);
                    });
            }

            if (!optimizationViews.GetFailedSubgraphs().empty())
            {
                std::stringstream warningMsg;
                warningMsg << "Some sub-graph(s) failed to optimize on " << backendObjPtr->GetId() << " backend.";
                ReportWarning(warningMsg.str(), errMessages);

                // Failed to optimize the given sub-graph, re-assign the sub-graph layers to other available backends
                BackendSettings settingsCopy(backendSettings);
                if (!backendObjPtr->GetId().IsCpuRef())
                {
                    // Add the current backend to the list of backends to ignore
                    settingsCopy.m_IgnoredBackends.insert(backendObjPtr->GetId());
                }

                int count = 0;
                for (auto& failedSubgraph : optimizationViews.GetFailedSubgraphs())
                {
                    // An error occurred: the optimization was attempted but not performed, try different backends
                    std::stringstream subgraphMsg;
                    subgraphMsg << "Re-assigning backends to " << failedSubgraph.GetLayers().size()
                                << " layers inside sub-graph " << count++;
                    ReportWarning(subgraphMsg.str(), errMessages);

                    OptimizationResult reassignmentResult = AssignBackends(optNetObjPtr,
                                                                           settingsCopy,
                                                                           *subgraph,
                                                                           errMessages);
                    if (reassignmentResult.m_Error)
                    {
                        // Failed to re-assign one of the remaining backends to each layer of the sub-graph
                        result.m_Error = true;
                        return result;
                    }
                }
            }
        }
    }

    return result;
}

bool RequiresCopy(ITensorHandleFactory::FactoryId src,
                  ITensorHandleFactory::FactoryId dst,
                  TensorHandleFactoryRegistry& registry)
{
    if (src != dst)
    {
        ITensorHandleFactory* srcFactory = registry.GetFactory(src);
        ITensorHandleFactory* dstFactory = registry.GetFactory(dst);

        if (srcFactory && dstFactory &&
            (srcFactory->GetExportFlags() & dstFactory->GetImportFlags()) != 0)
        {
            return false;
        }
        return true;
    }
    return false;
}
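
// Example (illustrative sketch): the test above is a plain bitmask
// intersection. An edge needs no copy when the producer can export to a
// memory source that the consumer can import from:
//
//     MemorySourceFlags exportFlags = srcFactory->GetExportFlags();
//     MemorySourceFlags importFlags = dstFactory->GetImportFlags();
//     bool zeroCopyPossible = (exportFlags & importFlags) != 0;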

// Find the handle factory for the input layer which results in fewest required copies.
ITensorHandleFactory::FactoryId CalculateSlotOptionForInput(BackendsMap& backends,
                                                            OutputSlot& slot,
                                                            TensorHandleFactoryRegistry& registry)
{
    Layer& layer = slot.GetOwningLayer();
    ARMNN_ASSERT(layer.GetType() == LayerType::Input);

    // Explicitly select the tensorhandle factory for InputLayer because the rules for it are slightly different. It
    // doesn't matter which backend it is assigned to because they all use the same implementation, which
    // requires Map/Unmap support. This means that, so long as the handle type supports map/unmap semantics, we can
    // select a factory with maximum compatibility with the layers connected to the InputLayer.

    // First ensure the from backends can support the TensorHandle API
    auto frmBackend = backends.find(layer.GetBackendId());
    if (frmBackend == backends.end() ||
        !frmBackend->second->SupportsTensorAllocatorAPI())
    {
        return ITensorHandleFactory::LegacyFactoryId;
    }

    // Go through all connections to the output slot and determine the TensorHandleFactory which results in the
    // fewest copies.
    std::map<ITensorHandleFactory::FactoryId, int> factoryScores;
    int topScore = 0;
    ITensorHandleFactory::FactoryId topChoice = ITensorHandleFactory::LegacyFactoryId;

    for (auto&& connection : slot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();

        auto toBackend = backends.find(connectedLayer.GetBackendId());
        ARMNN_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

        if (!toBackend->second.get()->SupportsTensorAllocatorAPI())
        {
            // The destination backend does not support the tensor allocator API, move to the next one
            continue;
        }

        auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();
        for (auto&& dst : dstPrefs)
        {
            // Input layers use the mem copy workload or import, so the selected factory must
            // support either the map/unmap API or Import API
            ITensorHandleFactory* factory = registry.GetFactory(dst);
            if (!factory->SupportsMapUnmap() &&
                !CheckFlag(factory->GetImportFlags(), MemorySource::Malloc)) // Just support cpu mem imports for now
            {
                // The current tensor handle factory does not support the map/unmap or import
                // strategy, move to the next one
                continue;
            }

            auto it = factoryScores.find(dst);
            if (it == factoryScores.end())
            {
                // Add new score to the table
                factoryScores[dst] = 0;
                if (topChoice == ITensorHandleFactory::LegacyFactoryId)
                {
                    topChoice = dst;
                }
            }
            else
            {
                // Increase the score
                factoryScores[dst]++;

                // Track the best option
                if (factoryScores[dst] > topScore)
                {
                    topScore = factoryScores[dst];
                    topChoice = dst;
                }
            }
        }
    }

    return topChoice;
}

// Find the handle factory for the output layer which results in fewest required copies.
ITensorHandleFactory::FactoryId CalculateSlotOptionForOutput(BackendsMap& backends,
                                                             OutputSlot& slot,
                                                             TensorHandleFactoryRegistry& registry)
{
    IgnoreUnused(backends, slot, registry);
    return ITensorHandleFactory::DeferredFactoryId;
}

// For all handle factories supported on the source backend, we wish to find the one which requires the fewest copies
// when considering all connections.
ITensorHandleFactory::FactoryId CalculateSlotOption(BackendsMap& backends,
                                                    OutputSlot& outputSlot,
                                                    TensorHandleFactoryRegistry& registry)
{
    // First ensure the from backends can support the TensorHandle API
    Layer& layer = outputSlot.GetOwningLayer();
    auto frmBackend = backends.find(layer.GetBackendId());
    if (frmBackend == backends.end() ||
        !frmBackend->second->SupportsTensorAllocatorAPI())
    {
        return ITensorHandleFactory::LegacyFactoryId;
    }

    // Connections to Output Layers require support for map/unmap on the TensorHandle.
    bool requiresMapUnmap = false;
    for (auto&& connection : outputSlot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();
        if (connectedLayer.GetType() == LayerType::Output)
        {
            requiresMapUnmap = true;
        }
    }

    IBackendInternal* srcBackend = frmBackend->second.get();
    auto srcPrefs = srcBackend->GetHandleFactoryPreferences();

    // Initialize the scores
    std::map<ITensorHandleFactory::FactoryId, int> factoryScores;
    for (auto&& pref : srcPrefs)
    {
        if (requiresMapUnmap) // Only consider factories that support map/unmap if required
        {
            ITensorHandleFactory* factory = registry.GetFactory(pref);
            if (!factory->SupportsMapUnmap())
            {
                // The current tensor handle factory does not support the map/unmap strategy, move to the next one
                continue;
            }
        }

        auto it = factoryScores.find(pref);
        if (it == factoryScores.end())
        {
            // Add new score to the table
            factoryScores[pref] = 0;
        }
    }

    // Score each handle factory based on how many times it requires copies on the slot connections
    for (auto&& connection : outputSlot.GetConnections())
    {
        const Layer& connectedLayer = connection->GetOwningLayer();

        auto toBackend = backends.find(connectedLayer.GetBackendId());
        ARMNN_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

        auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();
        for (auto&& src : srcPrefs)
        {
            if (factoryScores.find(src) == factoryScores.end()) // Don't consider excluded factories
            {
                continue;
            }

            for (auto&& dst : dstPrefs)
            {
                if (RequiresCopy(src, dst, registry))
                {
                    // Copy required for this connection, increase the score
                    factoryScores[src]++;
                    break;
                }
            }
        }
    }

    // Find the lowest score
    int minScore = std::numeric_limits<int>::max();
    for (auto it : factoryScores)
    {
        minScore = std::min(minScore, it.second);
    }

    // Collect factories matching the best (lowest) score
    std::vector<ITensorHandleFactory::FactoryId> optimalFactories;
    for (auto it : factoryScores)
    {
        if (it.second == minScore)
        {
            optimalFactories.push_back(it.first);
        }
    }

    // For all compatible factories matching the best score, find the preferred one for the current layer.
    for (auto&& srcPref : srcPrefs)
    {
        for (auto&& comp : optimalFactories)
        {
            if (comp == srcPref)
            {
                return comp;
            }
        }
    }

    return ITensorHandleFactory::LegacyFactoryId;
}

EdgeStrategy CalculateEdgeStrategy(BackendsMap& backends,
                                   ITensorHandleFactory::FactoryId srcFactoryId,
                                   const Layer& layer,
                                   const Layer& connectedLayer,
                                   TensorHandleFactoryRegistry& registry,
                                   bool importEnabled)
{
    auto toBackend = backends.find(connectedLayer.GetBackendId());
    ARMNN_ASSERT_MSG(toBackend != backends.end(), "Backend id not found for the connected layer");

    auto dstPrefs = toBackend->second.get()->GetHandleFactoryPreferences();

    // Legacy API check for backward compatibility
    if (srcFactoryId == ITensorHandleFactory::LegacyFactoryId || dstPrefs.empty())
    {
        if (layer.GetBackendId() != connectedLayer.GetBackendId())
        {
            return EdgeStrategy::CopyToTarget;
        }
        else
        {
            return EdgeStrategy::DirectCompatibility;
        }
    }

    // TensorHandleFactory API present, so perform more sophisticated strategies.
    // Dst Output layers don't require copy because they use import or map/unmap
    if (connectedLayer.GetType() == LayerType::Output)
    {
        return EdgeStrategy::DirectCompatibility;
    }

    // Search for direct match in prefs
    for (auto&& pref : dstPrefs)
    {
        if (pref == srcFactoryId)
        {
            return EdgeStrategy::DirectCompatibility;
        }
    }

    // Search for export/import options
    ITensorHandleFactory* srcFactory = registry.GetFactory(srcFactoryId);
    if (srcFactory->GetExportFlags() != 0 && importEnabled)
    {
        for (auto&& pref : dstPrefs)
        {
            ITensorHandleFactory* dstFactory = registry.GetFactory(pref);

            // Handles cases when a destPref is not listed in TensorHandleFactoryRegistry
            if (!dstFactory)
            {
                continue;
            }

            if ((dstFactory->GetImportFlags() & srcFactory->GetExportFlags()) != 0)
            {
                auto srcCapability = srcFactory->GetCapabilities(&layer, &layer, CapabilityClass::PaddingRequired);
                auto dstCapability = dstFactory->GetCapabilities(&connectedLayer,
                                                                 &connectedLayer,
                                                                 CapabilityClass::PaddingRequired);
                // Do not require memory copy if the source and destination do not require padding.
                if (srcCapability.empty() && dstCapability.empty())
                {
                    return EdgeStrategy::ExportToTarget;
                }
            }
        }
    }

    // Search for copy options via map/unmap
    if (srcFactory->SupportsMapUnmap())
    {
        for (auto&& pref : dstPrefs)
        {
            ITensorHandleFactory* dstFactory = registry.GetFactory(pref);
            if (dstFactory && dstFactory->SupportsMapUnmap())
            {
                return EdgeStrategy::CopyToTarget;
            }
        }
    }

    return EdgeStrategy::Undefined;
}

// Select the TensorHandleFactories and the corresponding memory strategy
OptimizationResult SelectTensorHandleStrategy(Graph& optGraph,
                                              BackendsMap& backends,
                                              TensorHandleFactoryRegistry& registry,
                                              bool importEnabled,
                                              Optional<std::vector<std::string>&> errMessages)
{
    OptimizationResult result;

    optGraph.ForEachLayer([&backends, &registry, &result, &errMessages, importEnabled](Layer* layer)
    {
        ARMNN_ASSERT(layer);

        // Let's make sure the backend is in our list of supported backends. Something went wrong during backend
        // assignment if this check fails
        ARMNN_ASSERT(backends.find(layer->GetBackendId()) != backends.end());

        // Check each output separately
        for (unsigned int slotIdx = 0; slotIdx < layer->GetNumOutputSlots(); slotIdx++)
        {
            OutputSlot& outputSlot = layer->GetOutputSlot(slotIdx);

            ITensorHandleFactory::FactoryId slotOption = ITensorHandleFactory::LegacyFactoryId;

            // Calculate the factory to use which results in the fewest copies being made.
            switch (layer->GetType())
            {
                case LayerType::Input:
                    slotOption = CalculateSlotOptionForInput(backends, outputSlot, registry);
                    break;
                case LayerType::Output:
                    slotOption = CalculateSlotOptionForOutput(backends, outputSlot, registry);
                    break;
                default:
                    slotOption = CalculateSlotOption(backends, outputSlot, registry);
                    break;
            }
            outputSlot.SetTensorHandleFactory(slotOption);

            // Now determine the "best" edge strategy for each connection given the slotOption.
            unsigned int connectionIdx = 0;
            for (auto&& connection : outputSlot.GetConnections())
            {
                const Layer& connectedLayer = connection->GetOwningLayer();

                EdgeStrategy strategy = CalculateEdgeStrategy(backends, slotOption, *layer, connectedLayer,
                                                              registry, importEnabled);

                if (strategy == EdgeStrategy::Undefined)
                {
                    result.m_Error = true;
                    if (errMessages)
                    {
                        errMessages.value().emplace_back("Could not find valid strategy required for compatibility"
                                                         " between backends.");
                    }
                    return;
                }

                outputSlot.SetEdgeStrategy(connectionIdx, strategy);

                connectionIdx++;
            }
        }
    });

    return result;
}

IOptimizedNetworkPtr Optimize(const INetwork& inNetwork,
                              const std::vector<BackendId>& backendPreferences,
                              const IDeviceSpec& deviceSpec,
                              const OptimizerOptions& options,
                              Optional<std::vector<std::string>&> messages)
{
    if (backendPreferences.empty())
    {
        throw armnn::InvalidArgumentException("Invoked Optimize with no backends specified");
    }

    if (options.m_ReduceFp32ToFp16 && options.m_ReduceFp32ToBf16)
    {
        throw InvalidArgumentException("BFloat16 and Float16 optimization cannot be enabled at the same time.");
    }

    const Network& network = *PolymorphicDowncast<const Network*>(&inNetwork);
    std::unique_ptr<Graph> graph = std::make_unique<Graph>(network.GetGraph());

    auto optNet = IOptimizedNetworkPtr(new OptimizedNetwork(std::move(graph)), &IOptimizedNetwork::Destroy);

    OptimizedNetwork* optNetObjPtr = PolymorphicDowncast<OptimizedNetwork*>(optNet.get());

    // Get the optimized graph
    Graph& optGraph = optNetObjPtr->GetGraph();

    // Perform optimisation passes
    using namespace optimizations;
    Optimizer::Pass(optGraph, MakeOptimizations(SquashEqualPermuteSiblings(),
                                                SquashEqualTransposeSiblings(),
                                                SquashEqualReshapeSiblings(),
                                                OptimizeInversePermutes(),
                                                OptimizeInverseTransposes(),
                                                MovePermuteUp(),
                                                MoveTransposeUp(),
                                                PermuteAsReshape(),
                                                TransposeAsReshape(),
                                                OptimizeConsecutiveReshapes(),
                                                FoldPadIntoConvolution2d(),
                                                PermuteAndBatchToSpaceAsDepthToSpace(),
                                                TransposeAndBatchToSpaceAsDepthToSpace()));

    // Infer the tensor infos for all output slots. Throws an exception on failure
    optGraph.InferTensorInfos();

    // If Fp32 to Fp16 optimization is set convert Fp32 network to Fp16
    if (options.m_ReduceFp32ToFp16)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(Fp32NetworkToFp16Converter()));
        Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsFloatToHalf()));
    }

    // If Fp32 to Bf16 optimization is set convert Fp32 network to Bf16
    // Convert input of Convolution2d and FullyConnected from Fp32 to Bf16
    // Only Constant weight of Convolution2d and FullyConnected are converted from Fp32 to Bf16
    if (options.m_ReduceFp32ToBf16)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(Fp32NetworkToBf16Converter()));
    }

    // Initialize backend settings
    BackendSettings backendSettings(backendPreferences, deviceSpec);
    if (backendSettings.GetAvailablePreferredBackends().empty())
    {
        std::stringstream failureMsg;
        failureMsg << "None of the preferred backends " << backendPreferences
                   << " are supported. Current platform provides " << backendSettings.m_SupportedBackends;
        ReportError(failureMsg.str(), messages);
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // Create a map to temporarily hold initialized backend objects
    TensorHandleFactoryRegistry tensorHandleFactoryRegistry;
    BackendsMap backends = CreateSupportedBackends(tensorHandleFactoryRegistry, backendSettings);

    // Assign an available backend to each layer
    Graph::Iterator firstLayer = optGraph.begin();
    Graph::Iterator lastLayer  = optGraph.end();
    OptimizationResult assignBackendsResult = AssignBackends(optNetObjPtr,
                                                             backendSettings,
                                                             firstLayer,
                                                             lastLayer,
                                                             messages);
    if (assignBackendsResult.m_Error)
    {
        // Failed to assign a backend to each layer
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    Optimizer::Pass(optGraph, MakeOptimizations(OptimizeInverseConversionsFp16(),
                                                OptimizeInverseConversionsFp32()));

    // Apply the backend-specific optimizations
    OptimizationResult backendOptimizationResult = ApplyBackendOptimizations(optNetObjPtr,
                                                                             backendSettings,
                                                                             backends,
                                                                             messages);
    if (backendOptimizationResult.m_Error)
    {
        // Failed to apply the backend-specific optimizations
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // If the debug flag is set, then insert a DebugLayer after each layer
    // Doing this after applying the backend optimizations as they might have changed some layers
    if (options.m_Debug)
    {
        Optimizer::Pass(optGraph, MakeOptimizations(InsertDebugLayer()));
    }

    // Calculate the compatibility strategies for tensor handles
    OptimizationResult strategyResult = SelectTensorHandleStrategy(optGraph,
                                                                   backends,
                                                                   tensorHandleFactoryRegistry,
                                                                   options.m_ImportEnabled,
                                                                   messages);
    if (strategyResult.m_Error)
    {
        // Failed to select a tensor handle strategy
        return IOptimizedNetworkPtr(nullptr, &IOptimizedNetwork::Destroy);
    }

    // Based on the tensor handle strategy determined above, insert copy layers where required.
    optGraph.AddCompatibilityLayers(backends, tensorHandleFactoryRegistry);

    // Convert constants
    Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsFloatToHalf()));
    Optimizer::Pass(optGraph, MakeOptimizations(ConvertConstantsHalfToFloat()));

    // Run backend specific optimizations (deprecated)
    for (auto&& chosenBackend : backendSettings.m_SelectedBackends)
    {
        auto factoryFun = BackendRegistryInstance().GetFactory(chosenBackend);
        auto backendPtr = factoryFun();
        ARMNN_ASSERT(backendPtr.get() != nullptr);

        ARMNN_NO_DEPRECATE_WARN_BEGIN
        auto backendSpecificOptimizations = backendPtr->GetOptimizations();
        ARMNN_NO_DEPRECATE_WARN_END

        if (!backendSpecificOptimizations.empty())
        {
            Optimizer::Pass(optNetObjPtr->GetGraph(), backendSpecificOptimizations);
        }
    }

    return optNet;
}
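
// Example (illustrative sketch): a typical call to Optimize(), preferring the
// Neon backend with the reference backend as fallback ('net' is an INetworkPtr
// built elsewhere):
//
//     std::vector<armnn::BackendId> preferences = { armnn::Compute::CpuAcc,
//                                                   armnn::Compute::CpuRef };
//     armnn::IRuntimePtr runtime = armnn::IRuntime::Create(armnn::IRuntime::CreationOptions());
//     armnn::IOptimizedNetworkPtr optNet = armnn::Optimize(*net,
//                                                          preferences,
//                                                          runtime->GetDeviceSpec(),
//                                                          armnn::OptimizerOptions());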

bool Network::GetShapeInferenceMethod()
{
    if (m_NetworkOptions.size() > 0 && m_NetworkOptions[0].GetBackendId().Get() == "ShapeInferenceMethod")
    {
        return m_NetworkOptions[0].GetOption(0).GetValue().AsBool();
    }

    return false;
}
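
// Example (illustrative sketch): the option probed above is modelled as a
// BackendOptions entry whose "backend id" is the string "ShapeInferenceMethod":
//
//     armnn::BackendOptions shapeOption("ShapeInferenceMethod",
//                                       { { "InferAndValidate", true } });
//     armnn::INetworkPtr net = armnn::INetwork::Create({ shapeOption });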

Network::Network(NetworkOptions networkOptions)
: m_NetworkOptions(networkOptions),
  m_Graph(std::make_unique<Graph>(GetShapeInferenceMethod()))
{}

Network::~Network()
{
}

Status Network::PrintGraph()
{
    m_Graph->Print();
    return Status::Success;
}

IConnectableLayer* Network::AddInputLayer(LayerBindingId id, const char* name)
{
    return m_Graph->AddLayer<InputLayer>(id, name);
}

IConnectableLayer* Network::AddBatchToSpaceNdLayer(const BatchToSpaceNdDescriptor& batchToSpaceNdDescriptor,
                                                   const char* name)
{
    return m_Graph->AddLayer<BatchToSpaceNdLayer>(batchToSpaceNdDescriptor, name);
}

IConnectableLayer* Network::AddComparisonLayer(const ComparisonDescriptor& comparisonDescriptor,
                                               const char* name)
{
    return m_Graph->AddLayer<ComparisonLayer>(comparisonDescriptor, name);
}

IConnectableLayer* Network::AddElementwiseUnaryLayer(const ElementwiseUnaryDescriptor& elementwiseUnaryDescriptor,
                                                     const char* name)
{
    return m_Graph->AddLayer<ElementwiseUnaryLayer>(elementwiseUnaryDescriptor, name);
}

IConnectableLayer* Network::AddFillLayer(const FillDescriptor& fillDescriptor,
                                         const char* name)
{
    return m_Graph->AddLayer<FillLayer>(fillDescriptor, name);
}

IConnectableLayer* Network::AddFullyConnectedLayerImpl(const FullyConnectedDescriptor& fullyConnectedDescriptor,
                                                       const ConstTensor& weights,
                                                       const Optional<ConstTensor>& biases,
                                                       const char* name)
{
    if (fullyConnectedDescriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddFullyConnectedLayer: biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<FullyConnectedLayer>(fullyConnectedDescriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (fullyConnectedDescriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}

IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
                                                   const ConstTensor& weights,
                                                   const Optional<ConstTensor>& biases,
                                                   const char* name)
{
    return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
                                                   const ConstTensor& weights,
                                                   const char* name)
{
    Optional<ConstTensor> biases;
    return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddFullyConnectedLayer(const FullyConnectedDescriptor& fullyConnectedDescriptor,
                                                   const ConstTensor& weights,
                                                   const ConstTensor& biases,
                                                   const char* name)
{
    Optional<ConstTensor> optionalBiases(biases);
    return AddFullyConnectedLayerImpl(fullyConnectedDescriptor, weights, optionalBiases, name);
}
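
// Example (illustrative sketch): adding a fully connected layer with constant
// weights and bias; 'weightData', 'biasData' and the shapes are placeholders:
//
//     armnn::FullyConnectedDescriptor fcDesc;
//     fcDesc.m_BiasEnabled = true;
//     armnn::ConstTensor weights(armnn::TensorInfo({ 16, 8 }, armnn::DataType::Float32), weightData);
//     armnn::ConstTensor bias(armnn::TensorInfo({ 8 }, armnn::DataType::Float32), biasData);
//     armnn::IConnectableLayer* fc = net->AddFullyConnectedLayer(fcDesc, weights, bias, "fc1");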

IConnectableLayer* Network::AddConcatLayer(const ConcatDescriptor& concatDescriptor,
                                           const char* name)
{
    return m_Graph->AddLayer<ConcatLayer>(concatDescriptor, name);
}

IConnectableLayer* Network::AddConvolution2dLayerImpl(const Convolution2dDescriptor& convolution2dDescriptor,
                                                      const ConstTensor& weights,
                                                      const Optional<ConstTensor>& biases,
                                                      const char* name)
{
    if (convolution2dDescriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddConvolution2dLayer: biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<Convolution2dLayer>(convolution2dDescriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (convolution2dDescriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}

IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
                                                  const ConstTensor& weights,
                                                  const Optional<ConstTensor>& biases,
                                                  const char* name)
{
    return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
                                                  const ConstTensor& weights,
                                                  const char* name)
{
    Optional<ConstTensor> biases;
    return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddConvolution2dLayer(const Convolution2dDescriptor& convolution2dDescriptor,
                                                  const ConstTensor& weights,
                                                  const ConstTensor& biases,
                                                  const char* name)
{
    Optional<ConstTensor> optionalBiases(biases);
    return AddConvolution2dLayerImpl(convolution2dDescriptor, weights, optionalBiases, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayerImpl(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const Optional<ConstTensor>& biases,
    const char* name)
{
    if (convolution2dDescriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddDepthwiseConvolution2dLayer: biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<DepthwiseConvolution2dLayer>(convolution2dDescriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (convolution2dDescriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}

IConnectableLayer* Network::AddDepthToSpaceLayer(const DepthToSpaceDescriptor& depthToSpaceDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<DepthToSpaceLayer>(depthToSpaceDescriptor, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const Optional<ConstTensor>& biases,
    const char* name)
{
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const char* name)
{
    Optional<ConstTensor> biases;
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, biases, name);
}

IConnectableLayer* Network::AddDepthwiseConvolution2dLayer(
    const DepthwiseConvolution2dDescriptor& convolution2dDescriptor,
    const ConstTensor& weights,
    const ConstTensor& biases,
    const char* name)
{
    Optional<ConstTensor> optionalBiases(biases);
    return AddDepthwiseConvolution2dLayerImpl(convolution2dDescriptor, weights, optionalBiases, name);
}

IConnectableLayer* Network::AddDetectionPostProcessLayer(const DetectionPostProcessDescriptor& descriptor,
                                                         const ConstTensor& anchors, const char* name)
{
    const auto layer = m_Graph->AddLayer<DetectionPostProcessLayer>(descriptor, name);

    layer->m_Anchors = std::make_unique<ScopedCpuTensorHandle>(anchors);

    return layer;
}

IConnectableLayer* Network::AddPermuteLayer(const PermuteDescriptor& permuteDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<PermuteLayer>(permuteDescriptor, name);
}

IConnectableLayer* Network::AddPooling2dLayer(const Pooling2dDescriptor& pooling2dDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<Pooling2dLayer>(pooling2dDescriptor, name);
}

IConnectableLayer* Network::AddActivationLayer(const ActivationDescriptor& activationDescriptor,
                                               const char* name)
{
    return m_Graph->AddLayer<ActivationLayer>(activationDescriptor, name);
}

IConnectableLayer* Network::AddArgMinMaxLayer(const ArgMinMaxDescriptor& argMinMaxDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<ArgMinMaxLayer>(argMinMaxDescriptor, name);
}

IConnectableLayer* Network::AddNormalizationLayer(const NormalizationDescriptor& normalizationDescriptor,
                                                  const char* name)
{
    return m_Graph->AddLayer<NormalizationLayer>(normalizationDescriptor, name);
}

IConnectableLayer* Network::AddSliceLayer(const SliceDescriptor& sliceDescriptor, const char* name)
{
    return m_Graph->AddLayer<SliceLayer>(sliceDescriptor, name);
}

IConnectableLayer* Network::AddSoftmaxLayer(const SoftmaxDescriptor& softmaxDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<SoftmaxLayer>(softmaxDescriptor, name);
}

IConnectableLayer* Network::AddSplitterLayer(const ViewsDescriptor& splitterDescriptor,
                                             const char* name)
{
    return m_Graph->AddLayer<SplitterLayer>(splitterDescriptor, name);
}

IConnectableLayer* Network::AddMaximumLayer(const char* name)
{
    return m_Graph->AddLayer<MaximumLayer>(name);
}

IConnectableLayer* Network::AddMinimumLayer(const char* name)
{
    return m_Graph->AddLayer<MinimumLayer>(name);
}

IConnectableLayer* Network::AddMergerLayer(const MergerDescriptor& mergerDescriptor,
                                           const char* name)
{
    return AddConcatLayer(mergerDescriptor, name);
}

IConnectableLayer* Network::AddAbsLayer(const char* name)
{
    return AddElementwiseUnaryLayer(ElementwiseUnaryDescriptor(UnaryOperation::Abs), name);
}

IConnectableLayer* Network::AddAdditionLayer(const char* name)
{
    return m_Graph->AddLayer<AdditionLayer>(name);
}

IConnectableLayer* Network::AddMultiplicationLayer(const char* name)
{
    return m_Graph->AddLayer<MultiplicationLayer>(name);
}

IConnectableLayer* Network::AddOutputLayer(LayerBindingId id, const char* name)
{
    return m_Graph->AddLayer<OutputLayer>(id, name);
}

IConnectableLayer* Network::AddBatchNormalizationLayer(const BatchNormalizationDescriptor& desc,
                                                       const ConstTensor& mean,
                                                       const ConstTensor& variance,
                                                       const ConstTensor& beta,
                                                       const ConstTensor& gamma,
                                                       const char* name)
{
    const auto layer = m_Graph->AddLayer<BatchNormalizationLayer>(desc, name);

    layer->m_Mean     = std::make_unique<ScopedCpuTensorHandle>(mean);
    layer->m_Variance = std::make_unique<ScopedCpuTensorHandle>(variance);
    layer->m_Beta     = std::make_unique<ScopedCpuTensorHandle>(beta);
    layer->m_Gamma    = std::make_unique<ScopedCpuTensorHandle>(gamma);

    return layer;
}

IConnectableLayer* Network::AddRankLayer(const char* name)
{
    return m_Graph->AddLayer<RankLayer>(name);
}

IConnectableLayer* Network::AddResizeBilinearLayer(const ResizeBilinearDescriptor& descriptor,
                                                   const char* name)
{
    ResizeDescriptor resizeDescriptor;
    resizeDescriptor.m_Method           = ResizeMethod::Bilinear;
    resizeDescriptor.m_DataLayout       = descriptor.m_DataLayout;
    resizeDescriptor.m_TargetWidth      = descriptor.m_TargetWidth;
    resizeDescriptor.m_TargetHeight     = descriptor.m_TargetHeight;
    resizeDescriptor.m_AlignCorners     = descriptor.m_AlignCorners;
    resizeDescriptor.m_HalfPixelCenters = descriptor.m_HalfPixelCenters;

    return m_Graph->AddLayer<ResizeLayer>(resizeDescriptor, name);
}

IConnectableLayer* Network::AddResizeLayer(const ResizeDescriptor& resizeDescriptor, const char* name)
{
    return m_Graph->AddLayer<ResizeLayer>(resizeDescriptor, name);
}

IConnectableLayer* Network::AddInstanceNormalizationLayer(const InstanceNormalizationDescriptor& desc,
                                                          const char* name)
{
    return m_Graph->AddLayer<InstanceNormalizationLayer>(desc, name);
}

IConnectableLayer* Network::AddL2NormalizationLayer(const L2NormalizationDescriptor& desc,
                                                    const char* name)
{
    return m_Graph->AddLayer<L2NormalizationLayer>(desc, name);
}

IConnectableLayer* Network::AddLogSoftmaxLayer(const LogSoftmaxDescriptor& desc,
                                               const char* name)
{
    return m_Graph->AddLayer<LogSoftmaxLayer>(desc, name);
}

IConnectableLayer* Network::AddConstantLayer(const ConstTensor& input, const char* name)
{
    auto layer = m_Graph->AddLayer<ConstantLayer>(name);

    layer->m_LayerOutput = std::make_unique<ScopedCpuTensorHandle>(input);

    return layer;
}

IConnectableLayer* Network::AddReshapeLayer(const ReshapeDescriptor& reshapeDescriptor,
                                            const char* name)
{
    return m_Graph->AddLayer<ReshapeLayer>(reshapeDescriptor, name);
}

IConnectableLayer* Network::AddSpaceToBatchNdLayer(const SpaceToBatchNdDescriptor& spaceToBatchNdDescriptor,
                                                   const char* name)
{
    return m_Graph->AddLayer<SpaceToBatchNdLayer>(spaceToBatchNdDescriptor, name);
}

IConnectableLayer* Network::AddSpaceToDepthLayer(const SpaceToDepthDescriptor& spaceToDepthDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<SpaceToDepthLayer>(spaceToDepthDescriptor, name);
}

IConnectableLayer* Network::AddFloorLayer(const char* name)
{
    return m_Graph->AddLayer<FloorLayer>(name);
}

IConnectableLayer* Network::AddLstmLayer(const LstmDescriptor& descriptor,
                                         const LstmInputParams& params,
                                         const char* name)
{
    const auto layer = m_Graph->AddLayer<LstmLayer>(descriptor, name);

    // Lstm Basic Parameters
    layer->m_BasicParameters.m_InputToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToForgetWeights));
    layer->m_BasicParameters.m_InputToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToCellWeights));
    layer->m_BasicParameters.m_InputToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToOutputWeights));
    layer->m_BasicParameters.m_RecurrentToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToForgetWeights));
    layer->m_BasicParameters.m_RecurrentToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToCellWeights));
    layer->m_BasicParameters.m_RecurrentToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToOutputWeights));
    layer->m_BasicParameters.m_ForgetGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetGateBias));
    layer->m_BasicParameters.m_CellBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellBias));
    layer->m_BasicParameters.m_OutputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputGateBias));

    // Lstm Cifg parameters
    if (!descriptor.m_CifgEnabled)
    {
        if (params.m_InputToInputWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Input To Input Weights cannot be NULL "
                                           "when CIFG is disabled.");
        }
        if (params.m_RecurrentToInputWeights == nullptr)
        {
            throw InvalidArgumentException(
                    "AddLstmLayer: Recurrent To Input Weights cannot be NULL "
                    "when CIFG is disabled.");
        }
        if (params.m_InputGateBias == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Input Gate Bias cannot be NULL "
                                           "when CIFG is disabled.");
        }
        layer->m_CifgParameters.m_InputToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToInputWeights));
        layer->m_CifgParameters.m_RecurrentToInputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToInputWeights));
        layer->m_CifgParameters.m_InputGateBias =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputGateBias));
    }

    // Lstm projection parameters
    if (descriptor.m_ProjectionEnabled)
    {
        if (params.m_ProjectionWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Projection Weights cannot be NULL "
                                           "when projection is enabled.");
        }
        layer->m_ProjectionParameters.m_ProjectionWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionWeights));
        if (params.m_ProjectionBias != nullptr)
        {
            layer->m_ProjectionParameters.m_ProjectionBias =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionBias));
        }
    }

    // Lstm Peephole params
    if (descriptor.m_PeepholeEnabled)
    {
        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_CellToInputWeights == nullptr)
            {
                throw InvalidArgumentException("AddLstmLayer: Cell To Input Weights cannot be NULL "
                                               "when Peephole is enabled and CIFG disabled.");
            }

            layer->m_PeepholeParameters.m_CellToInputWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToInputWeights));
        }

        if (params.m_CellToForgetWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell To Forget Weights cannot be NULL "
                                           "when Peephole is enabled.");
        }
        if (params.m_CellToOutputWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell To Output Weights cannot be NULL "
                                           "when Peephole is enabled.");
        }

        layer->m_PeepholeParameters.m_CellToForgetWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToForgetWeights));
        layer->m_PeepholeParameters.m_CellToOutputWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToOutputWeights));
    }

    // Lstm Layer Normalization params
    if (descriptor.m_LayerNormEnabled)
    {
        if (!descriptor.m_CifgEnabled)
        {
            if (params.m_InputLayerNormWeights == nullptr)
            {
                throw InvalidArgumentException("AddLstmLayer: Input layer normalization weights cannot be NULL "
                                               "when layer normalization is enabled and CIFG disabled.");
            }
            layer->m_LayerNormParameters.m_InputLayerNormWeights =
                std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputLayerNormWeights));
        }

        if (params.m_ForgetLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Forget layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        if (params.m_CellLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Cell layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        if (params.m_OutputLayerNormWeights == nullptr)
        {
            throw InvalidArgumentException("AddLstmLayer: Output layer normalization weights cannot be NULL "
                                           "when layer normalization is enabled.");
        }
        layer->m_LayerNormParameters.m_ForgetLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetLayerNormWeights));
        layer->m_LayerNormParameters.m_CellLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellLayerNormWeights));
        layer->m_LayerNormParameters.m_OutputLayerNormWeights =
            std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputLayerNormWeights));
    }
    return layer;
}

IConnectableLayer* Network::AddDivisionLayer(const char* name)
{
    return m_Graph->AddLayer<DivisionLayer>(name);
}

IConnectableLayer* Network::AddSubtractionLayer(const char* name)
{
    return m_Graph->AddLayer<SubtractionLayer>(name);
}

IConnectableLayer* Network::AddMeanLayer(const MeanDescriptor& meanDescriptor, const char* name)
{
    return m_Graph->AddLayer<MeanLayer>(meanDescriptor, name);
}

IConnectableLayer* Network::AddPadLayer(const PadDescriptor& padDescriptor, const char* name)
{
    return m_Graph->AddLayer<PadLayer>(padDescriptor, name);
}

IConnectableLayer* Network::AddQuantizeLayer(const char* name)
{
    return m_Graph->AddLayer<QuantizeLayer>(name);
}

IConnectableLayer* Network::AddDequantizeLayer(const char* name)
{
    return m_Graph->AddLayer<DequantizeLayer>(name);
}

IConnectableLayer* Network::AddStridedSliceLayer(const StridedSliceDescriptor& stridedSliceDescriptor,
                                                 const char* name)
{
    return m_Graph->AddLayer<StridedSliceLayer>(stridedSliceDescriptor, name);
}

IConnectableLayer* Network::AddGreaterLayer(const char* name)
{
    return AddComparisonLayer(ComparisonDescriptor(ComparisonOperation::Greater), name);
}

IConnectableLayer* Network::AddEqualLayer(const char* name)
{
    return AddComparisonLayer(ComparisonDescriptor(ComparisonOperation::Equal), name);
}

IConnectableLayer* Network::AddRsqrtLayer(const char* name)
{
    return AddElementwiseUnaryLayer(ElementwiseUnaryDescriptor(UnaryOperation::Rsqrt), name);
}

IConnectableLayer* Network::AddGatherLayer(const char* name)
{
    GatherDescriptor gatherDescriptor{};
    return AddGatherLayer(gatherDescriptor, name);
}

IConnectableLayer* Network::AddGatherLayer(const GatherDescriptor& gatherDescriptor,
                                           const char* name)
{
    return m_Graph->AddLayer<GatherLayer>(gatherDescriptor, name);
}

IConnectableLayer* Network::AddMergeLayer(const char* name)
{
    return m_Graph->AddLayer<MergeLayer>(name);
}

IConnectableLayer* Network::AddSwitchLayer(const char* name)
{
    return m_Graph->AddLayer<SwitchLayer>(name);
}

IConnectableLayer* Network::AddPreluLayer(const char* name)
{
    return m_Graph->AddLayer<PreluLayer>(name);
}

IConnectableLayer* Network::AddTransposeConvolution2dLayer(const TransposeConvolution2dDescriptor& descriptor,
                                                           const ConstTensor& weights,
                                                           const Optional<ConstTensor>& biases,
                                                           const char* name)
{
    if (descriptor.m_BiasEnabled && !biases.has_value())
    {
        throw InvalidArgumentException("AddTransposeConvolution2dLayer: Biases cannot be empty");
    }

    const auto layer = m_Graph->AddLayer<TransposeConvolution2dLayer>(descriptor, name);

    layer->m_Weight = std::make_unique<ScopedCpuTensorHandle>(weights);

    if (descriptor.m_BiasEnabled)
    {
        layer->m_Bias = std::make_unique<ScopedCpuTensorHandle>(biases.value());
    }

    return layer;
}

IConnectableLayer* Network::AddTransposeLayer(const TransposeDescriptor& transposeDescriptor,
                                              const char* name)
{
    return m_Graph->AddLayer<TransposeLayer>(transposeDescriptor, name);
}

IConnectableLayer* Network::AddStackLayer(const StackDescriptor& stackDescriptor,
                                          const char* name)
{
    return m_Graph->AddLayer<StackLayer>(stackDescriptor, name);
}

IConnectableLayer* Network::AddStandInLayer(const StandInDescriptor& desc,
                                            const char* name)
{
    return m_Graph->AddLayer<StandInLayer>(desc, name);
}

IConnectableLayer* Network::AddQuantizedLstmLayer(const QuantizedLstmInputParams& params,
                                                  const char* name)
{
    const auto layer = m_Graph->AddLayer<QuantizedLstmLayer>(name);

    // InputToX weights
    layer->m_QuantizedLstmParameters.m_InputToInputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToInputWeights());
    layer->m_QuantizedLstmParameters.m_InputToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToForgetWeights());
    layer->m_QuantizedLstmParameters.m_InputToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToCellWeights());
    layer->m_QuantizedLstmParameters.m_InputToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputToOutputWeights());

    // RecurrentToX weights
    layer->m_QuantizedLstmParameters.m_RecurrentToInputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToInputWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToForgetWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToForgetWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToCellWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToCellWeights());
    layer->m_QuantizedLstmParameters.m_RecurrentToOutputWeights =
        std::make_unique<ScopedCpuTensorHandle>(params.GetRecurrentToOutputWeights());

    // Bias
    layer->m_QuantizedLstmParameters.m_InputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetInputGateBias());
    layer->m_QuantizedLstmParameters.m_ForgetGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetForgetGateBias());
    layer->m_QuantizedLstmParameters.m_CellBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetCellBias());
    layer->m_QuantizedLstmParameters.m_OutputGateBias =
        std::make_unique<ScopedCpuTensorHandle>(params.GetOutputGateBias());

    return layer;
}
1855 
1857  const LstmInputParams& params,
1858  const char* name)
1859 {
1860  const auto layer = m_Graph->AddLayer<QLstmLayer>(descriptor, name);
1861 
1862  // QLstm Basic Parameters
1864  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToForgetWeights));
1865  layer->m_BasicParameters.m_InputToCellWeights =
1866  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToCellWeights));
1867  layer->m_BasicParameters.m_InputToOutputWeights =
1868  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToOutputWeights));
1869  layer->m_BasicParameters.m_RecurrentToForgetWeights =
1870  std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToForgetWeights));
1871  layer->m_BasicParameters.m_RecurrentToCellWeights =
1872  std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToCellWeights));
1873  layer->m_BasicParameters.m_RecurrentToOutputWeights =
1874  std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToOutputWeights));
1875  layer->m_BasicParameters.m_ForgetGateBias =
1876  std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetGateBias));
1877  layer->m_BasicParameters.m_CellBias =
1878  std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellBias));
1879  layer->m_BasicParameters.m_OutputGateBias =
1880  std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputGateBias));
1881 
1882  // QLstm Cifg parameters
1883  if(!descriptor.m_CifgEnabled)
1884  {
1885  if(params.m_InputToInputWeights == nullptr)
1886  {
1887  throw InvalidArgumentException("AddQLstmLayer: Input To Input Weights cannot be NULL");
1888  }
1889 
1890  if(params.m_RecurrentToInputWeights == nullptr)
1891  {
1893  "AddQLstmLayer: Recurrent To Input Weights cannot be NULL");
1894  }
1895 
1896  if(params.m_InputGateBias == nullptr)
1897  {
1898  throw InvalidArgumentException("AddQLstmLayer: Input Gate Bias cannot be NULL");
1899  }
1900 
1901  layer->m_CifgParameters.m_InputToInputWeights =
1902  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputToInputWeights));
1903  layer->m_CifgParameters.m_RecurrentToInputWeights =
1904  std::make_unique<ScopedCpuTensorHandle>(*(params.m_RecurrentToInputWeights));
1905  layer->m_CifgParameters.m_InputGateBias =
1906  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputGateBias));
1907  }
1908 
1909  // QLstm Projection parameters
1910  if(descriptor.m_ProjectionEnabled)
1911  {
1912  if(params.m_ProjectionWeights == nullptr)
1913  {
1914  throw InvalidArgumentException("AddQLstmLayer: Projection Weights cannot be NULL");
1915  }
1916 
1917  layer->m_ProjectionParameters.m_ProjectionWeights =
1918  std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionWeights));
1919 
1920  // Projection bias is optional even if projection is enabled
1921  if(params.m_ProjectionBias != nullptr)
1922  {
1923  layer->m_ProjectionParameters.m_ProjectionBias =
1924  std::make_unique<ScopedCpuTensorHandle>(*(params.m_ProjectionBias));
1925  }
1926 
1927  }
1928 
1929  // QLstm Peephole params
1930  if(descriptor.m_PeepholeEnabled)
1931  {
1932  if(params.m_CellToForgetWeights == nullptr)
1933  {
1934  throw InvalidArgumentException("AddQLstmLayer: Cell To Forget Weights cannot be NULL");
1935  }
1936 
1937  if(params.m_CellToOutputWeights == nullptr)
1938  {
1939  throw InvalidArgumentException("AddQLstmLayer: Cell To Output Weights cannot be NULL");
1940  }
1941 
1942  if(!descriptor.m_CifgEnabled)
1943  {
1944  if(params.m_CellToInputWeights == nullptr)
1945  {
1946  throw InvalidArgumentException("AddQLstmLayer: Cell To Input Weights cannot be NULL");
1947  }
1948 
1949  layer->m_PeepholeParameters.m_CellToInputWeights =
1950  std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToInputWeights));
1951  }
1952 
1953  layer->m_PeepholeParameters.m_CellToForgetWeights =
1954  std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToForgetWeights));
1955  layer->m_PeepholeParameters.m_CellToOutputWeights =
1956  std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellToOutputWeights));
1957  }
1958 
1959  // QLstm Layer Normalization params
1960  if(descriptor.m_LayerNormEnabled)
1961  {
1962  if(params.m_ForgetLayerNormWeights == nullptr)
1963  {
1964  throw InvalidArgumentException("AddQLstmLayer: Forget layer normalization weights cannot be NULL");
1965  }
1966 
1967  if(params.m_CellLayerNormWeights == nullptr)
1968  {
1969  throw InvalidArgumentException("AddQLstmLayer: Cell layer normalization weights cannot be NULL");
1970  }
1971 
1972  if(params.m_OutputLayerNormWeights == nullptr)
1973  {
1974  throw InvalidArgumentException("AddQLstmLayer: Output layer normalization weights cannot be NULL");
1975  }
1976 
1977  if(!descriptor.m_CifgEnabled)
1978  {
1979  if(params.m_InputLayerNormWeights == nullptr)
1980  {
1981  throw InvalidArgumentException("AddQLstmLayer: Input layer normalization weights cannot be NULL");
1982  }
1983 
1984  layer->m_LayerNormParameters.m_InputLayerNormWeights =
1985  std::make_unique<ScopedCpuTensorHandle>(*(params.m_InputLayerNormWeights));
1986  }
1987 
1988  layer->m_LayerNormParameters.m_ForgetLayerNormWeights =
1989  std::make_unique<ScopedCpuTensorHandle>(*(params.m_ForgetLayerNormWeights));
1990  layer->m_LayerNormParameters.m_CellLayerNormWeights =
1991  std::make_unique<ScopedCpuTensorHandle>(*(params.m_CellLayerNormWeights));
1992  layer->m_LayerNormParameters.m_OutputLayerNormWeights =
1993  std::make_unique<ScopedCpuTensorHandle>(*(params.m_OutputLayerNormWeights));
1994  }
1995  return layer;
1996 }
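
The descriptor flags above gate which optional tensor groups are validated and copied. A hedged sketch of the simplest configuration, CIFG enabled with no projection, peephole or layer normalization, where only the nine basic tensors are required; shapes, quantization parameters and the helper name are illustrative assumptions:

#include <armnn/INetwork.hpp>
#include <armnn/Descriptors.hpp>
#include <armnn/LstmParams.hpp>
#include <vector>

armnn::IConnectableLayer* AddExampleQLstm(armnn::INetwork& net)
{
    using namespace armnn;

    QLstmDescriptor desc;
    desc.m_CifgEnabled       = true;   // couples the input gate to the forget gate
    desc.m_ProjectionEnabled = false;
    desc.m_PeepholeEnabled   = false;
    desc.m_LayerNormEnabled  = false;

    // Illustrative shapes: QSymmS8 weights, Signed32 biases.
    constexpr unsigned int numUnits = 4, inputSize = 2;
    TensorInfo wInfo({numUnits, inputSize}, DataType::QSymmS8, 0.05f, 0);
    TensorInfo rInfo({numUnits, numUnits},  DataType::QSymmS8, 0.05f, 0);
    TensorInfo bInfo({numUnits},            DataType::Signed32, 0.001f, 0);

    std::vector<int8_t>  w(wInfo.GetNumElements(), 1), r(rInfo.GetNumElements(), 1);
    std::vector<int32_t> b(numUnits, 0);

    ConstTensor i2f(wInfo, w), i2c(wInfo, w), i2o(wInfo, w);
    ConstTensor r2f(rInfo, r), r2c(rInfo, r), r2o(rInfo, r);
    ConstTensor bf(bInfo, b),  bc(bInfo, b),  bo(bInfo, b);

    // The nine basic tensors are dereferenced unconditionally above,
    // so all of them must be set even when every optional group is off.
    LstmInputParams params;
    params.m_InputToForgetWeights     = &i2f;
    params.m_InputToCellWeights       = &i2c;
    params.m_InputToOutputWeights     = &i2o;
    params.m_RecurrentToForgetWeights = &r2f;
    params.m_RecurrentToCellWeights   = &r2c;
    params.m_RecurrentToOutputWeights = &r2o;
    params.m_ForgetGateBias           = &bf;
    params.m_CellBias                 = &bc;
    params.m_OutputGateBias           = &bo;

    return net.AddQLstmLayer(desc, params, "qLstm");
}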
1997 
1998 void Network::Accept(ILayerVisitor& visitor) const
1999 {
2000  for (auto layer : GetGraph())
2001  {
2002  layer->Accept(visitor);
2003  }
2004 }
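
Network::Accept above simply forwards the visitor to every layer of the graph. A minimal sketch of a compatible visitor, assuming armnn/LayerVisitorBase.hpp and its VisitorNoThrowPolicy (public ArmNN headers, though not used in this file), which supply no-op defaults so only the callbacks of interest need overriding:

#include <armnn/LayerVisitorBase.hpp>
#include <iostream>

// Prints the binding id and name of every input layer it visits; all other
// layer types fall through to the no-op defaults.
struct InputNamePrinter : armnn::LayerVisitorBase<armnn::VisitorNoThrowPolicy>
{
    void VisitInputLayer(const armnn::IConnectableLayer* /*layer*/,
                         armnn::LayerBindingId id,
                         const char* name) override
    {
        std::cout << "input " << id << ": " << (name ? name : "<unnamed>") << "\n";
    }
};

// Usage: InputNamePrinter printer; network->Accept(printer);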
2005 
2006 OptimizedNetwork::OptimizedNetwork(std::unique_ptr<Graph> graph)
2007  : m_Graph(std::move(graph)), m_Guid(profiling::ProfilingService::GetNextGuid())
2008 {
2009 }
2010 
2011 OptimizedNetwork::~OptimizedNetwork()
2012 {
2013 }
2014 
2015 } // namespace armnn
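
For context, the entry points defined in this file combine into the usual build-then-optimize flow. A hedged end-to-end sketch, assuming the CpuRef reference backend has been built in:

#include <armnn/ArmNN.hpp>

int main()
{
    using namespace armnn;

    // Build a trivial identity network: one input wired straight to one output.
    INetworkPtr net = INetwork::Create();
    IConnectableLayer* input  = net->AddInputLayer(0, "input");
    IConnectableLayer* output = net->AddOutputLayer(0, "output");
    input->GetOutputSlot(0).Connect(output->GetInputSlot(0));
    input->GetOutputSlot(0).SetTensorInfo(TensorInfo({1, 4}, DataType::Float32));

    // Optimize for the reference backend and print the resulting graph.
    IRuntimePtr runtime = IRuntime::Create(IRuntime::CreationOptions());
    IOptimizedNetworkPtr optNet =
        Optimize(*net, {Compute::CpuRef}, runtime->GetDeviceSpec());
    return optNet->PrintGraph() == Status::Success ? 0 : 1;
}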