ArmNN 20.08
ExecuteNetwork.cpp
//
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "../NetworkExecutionUtils/NetworkExecutionUtils.hpp"

// MAIN
int main(int argc, const char* argv[])
{
    // Configures logging for both the ARMNN library and this test program.
#ifdef NDEBUG
    armnn::LogSeverity level = armnn::LogSeverity::Info;
#else
    armnn::LogSeverity level = armnn::LogSeverity::Debug;
#endif
    armnn::ConfigureLogging(true, true, level);
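    // ConfigureLogging(printToStandardOutput, printToDebugOutput, severity):
    // both output sinks are enabled here, at the severity selected above.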

    std::string testCasesFile;

    std::string modelFormat;
    std::string modelPath;
    std::string inputNames;
    std::string inputTensorShapes;
    std::string inputTensorDataFilePaths;
    std::string outputNames;
    std::string inputTypes;
    std::string outputTypes;
    std::string dynamicBackendsPath;
    std::string outputTensorFiles;

    // external profiling parameters
    std::string outgoingCaptureFile;
    std::string incomingCaptureFile;
    uint32_t counterCapturePeriod;
    std::string fileFormat;

    size_t iterations = 1;
    int tuningLevel = 0;
    std::string tuningPath;

    double thresholdTime = 0.0;

    size_t subgraphId = 0;

    const std::string backendsMessage = "REQUIRED: Which device to run layers on by default. Possible choices: "
                                        + armnn::BackendRegistryInstance().GetBackendIdsAsString();
    po::options_description desc("Options");
    try
    {
        desc.add_options()
            ("help", "Display usage information")
            ("compute,c", po::value<std::vector<std::string>>()->multitoken()->required(),
             backendsMessage.c_str())
            ("test-cases,t", po::value(&testCasesFile), "Path to a CSV file containing test cases to run. "
             "If set, further parameters -- with the exception of compute device and concurrency -- will be ignored, "
             "as they are expected to be defined in the file for each test in particular.")
            ("concurrent,n", po::bool_switch()->default_value(false),
             "Whether or not the test cases should be executed in parallel")
            ("model-format,f", po::value(&modelFormat)->required(),
             "armnn-binary, caffe-binary, caffe-text, onnx-binary, onnx-text, tflite-binary, tensorflow-binary or "
             "tensorflow-text.")
            ("model-path,m", po::value(&modelPath)->required(), "Path to model file, e.g. .armnn, .caffemodel, "
             ".prototxt, .tflite, .onnx")
            ("dynamic-backends-path,b", po::value(&dynamicBackendsPath),
             "Path where to load any available dynamic backend from. "
             "If left empty (the default), dynamic backends will not be used.")
            ("input-name,i", po::value(&inputNames),
             "Identifiers of the input tensors in the network, separated by commas.")
            ("subgraph-number,x", po::value<size_t>(&subgraphId)->default_value(0), "Id of the subgraph to be executed. "
             "Defaults to 0.")
            ("input-tensor-shape,s", po::value(&inputTensorShapes),
             "The shape of the input tensors in the network as a flat array of integers separated by commas. "
             "Several shapes can be passed by separating them with a colon (:). "
             "This parameter is optional, depending on the network.")
            ("input-tensor-data,d", po::value(&inputTensorDataFilePaths)->default_value(""),
             "Path to files containing the input data as a flat array separated by whitespace. "
             "Several paths can be passed by separating them with a comma. If not specified, the network will be run "
             "with dummy data (useful for profiling).")
            ("input-type,y", po::value(&inputTypes), "The types of the input tensors in the network, separated by commas. "
             "If unset, defaults to \"float\" for all defined inputs. "
             "Accepted values (float, int or qasymm8)")
            ("quantize-input,q", po::bool_switch()->default_value(false),
             "If this option is enabled, all float inputs will be quantized to qasymm8. "
             "If unset, defaults to not quantized. "
             "Accepted values (true or false)")
            ("output-type,z", po::value(&outputTypes),
             "The types of the output tensors in the network, separated by commas. "
             "If unset, defaults to \"float\" for all defined outputs. "
             "Accepted values (float, int or qasymm8).")
            ("dequantize-output,l", po::bool_switch()->default_value(false),
             "If this option is enabled, all quantized outputs will be dequantized to float. "
             "If unset, defaults to not dequantized. "
             "Accepted values (true or false)")
            ("output-name,o", po::value(&outputNames),
             "Identifiers of the output tensors in the network, separated by commas.")
            ("write-outputs-to-file,w", po::value(&outputTensorFiles),
             "Comma-separated list of output file paths keyed with the binding-id of the output slot. "
             "If left empty (the default), the output tensors will not be written to a file.")
            ("event-based-profiling,e", po::bool_switch()->default_value(false),
             "Enables the built-in profiler. If unset, defaults to off.")
            ("visualize-optimized-model,v", po::bool_switch()->default_value(false),
             "Enables the optimized model visualizer. If unset, defaults to off.")
            ("bf16-turbo-mode", po::bool_switch()->default_value(false), "If this option is enabled, FP32 layers, "
             "weights and biases will be converted to BFloat16 where the backend supports it")
            ("fp16-turbo-mode,h", po::bool_switch()->default_value(false), "If this option is enabled, FP32 layers, "
             "weights and biases will be converted to FP16 where the backend supports it")
            ("threshold-time,r", po::value<double>(&thresholdTime)->default_value(0.0),
             "Threshold time is the maximum allowed time for inference, measured in milliseconds. If the actual "
             "inference time is greater than the threshold time, the test will fail. By default, no threshold "
             "time is used.")
            ("print-intermediate-layers,p", po::bool_switch()->default_value(false),
             "If this option is enabled, the output of every graph layer will be printed.")
            ("enable-external-profiling,a", po::bool_switch()->default_value(false),
             "If enabled, external profiling will be switched on")
            ("timeline-profiling", po::bool_switch()->default_value(false),
             "If enabled, timeline profiling will be switched on; requires external profiling")
            ("outgoing-capture-file,j", po::value(&outgoingCaptureFile),
             "If specified, the outgoing external profiling packets will be captured in this binary file")
            ("incoming-capture-file,k", po::value(&incomingCaptureFile),
             "If specified, the incoming external profiling packets will be captured in this binary file")
            ("file-only-external-profiling,g", po::bool_switch()->default_value(false),
             "If enabled, the 'file-only' test mode of external profiling will be enabled")
            ("counter-capture-period,u", po::value<uint32_t>(&counterCapturePeriod)->default_value(150u),
             "If profiling is enabled in 'file-only' mode, this is the capture period that will be used in the test")
            ("file-format", po::value(&fileFormat)->default_value("binary"),
             "If profiling is enabled, specifies the output file format")
            ("iterations", po::value<size_t>(&iterations)->default_value(1),
             "Number of iterations to run the network for; defaults to 1")
            ("tuning-path", po::value(&tuningPath),
             "Path to tuning file. Enables use of CL tuning")
            ("tuning-level", po::value<int>(&tuningLevel)->default_value(0),
             "Sets the tuning level, which enables a tuning run that will update/create a tuning file. "
             "Available options are: 1 (Rapid), 2 (Normal), 3 (Exhaustive). "
             "Requires tuning-path to be set; defaults to 0 (no tuning run)")
            ("parse-unsupported", po::bool_switch()->default_value(false),
             "Add unsupported operators as stand-in layers (where supported by parser)")
            ("infer-output-shape", po::bool_switch()->default_value(false),
             "Infers output tensor shape from input tensor shape and validates where applicable (where supported by "
             "parser)");
    }
    catch (const std::exception& e)
    {
        // Coverity points out that default_value(...) can throw a bad_lexical_cast,
        // and that desc.add_options() can throw boost::io::too_few_args.
        // They really won't in any of these cases.
        ARMNN_ASSERT_MSG(false, "Caught unexpected exception");
        ARMNN_LOG(fatal) << "Fatal internal error: " << e.what();
        return EXIT_FAILURE;
    }
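    // Illustrative invocation (the model path and tensor names below are hypothetical):
    //   ExecuteNetwork -c CpuAcc -f tflite-binary -m model.tflite -i input -o output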

    // Parses the command-line.
    po::variables_map vm;
    try
    {
        po::store(po::parse_command_line(argc, argv, desc), vm);

        if (CheckOption(vm, "help") || argc <= 1)
        {
            std::cout << "Executes a neural network model using the provided input tensor. " << std::endl;
            std::cout << "Prints the resulting output tensor." << std::endl;
            std::cout << std::endl;
            std::cout << desc << std::endl;
            return EXIT_SUCCESS;
        }

        po::notify(vm);
    }
    catch (const po::error& e)
    {
        std::cerr << e.what() << std::endl << std::endl;
        std::cerr << desc << std::endl;
        return EXIT_FAILURE;
    }

    // Get the values of the switch arguments.
    bool concurrent = vm["concurrent"].as<bool>();
    bool enableProfiling = vm["event-based-profiling"].as<bool>();
    bool enableLayerDetails = vm["visualize-optimized-model"].as<bool>();
    bool enableBf16TurboMode = vm["bf16-turbo-mode"].as<bool>();
    bool enableFp16TurboMode = vm["fp16-turbo-mode"].as<bool>();
    bool quantizeInput = vm["quantize-input"].as<bool>();
    bool dequantizeOutput = vm["dequantize-output"].as<bool>();
    bool printIntermediate = vm["print-intermediate-layers"].as<bool>();
    bool enableExternalProfiling = vm["enable-external-profiling"].as<bool>();
    bool fileOnlyExternalProfiling = vm["file-only-external-profiling"].as<bool>();
    bool parseUnsupported = vm["parse-unsupported"].as<bool>();
    bool timelineEnabled = vm["timeline-profiling"].as<bool>();
    bool inferOutputShape = vm["infer-output-shape"].as<bool>();

    if (enableBf16TurboMode && enableFp16TurboMode)
    {
        ARMNN_LOG(fatal) << "BFloat16 and Float16 turbo mode cannot be enabled at the same time.";
        return EXIT_FAILURE;
    }

    // Create runtime options
    armnn::IRuntime::CreationOptions options;
    options.m_EnableGpuProfiling = enableProfiling;
    options.m_DynamicBackendsPath = dynamicBackendsPath;
    options.m_ProfilingOptions.m_EnableProfiling = enableExternalProfiling;
    options.m_ProfilingOptions.m_IncomingCaptureFile = incomingCaptureFile;
    options.m_ProfilingOptions.m_OutgoingCaptureFile = outgoingCaptureFile;
    options.m_ProfilingOptions.m_FileOnly = fileOnlyExternalProfiling;
    options.m_ProfilingOptions.m_CapturePeriod = counterCapturePeriod;
    options.m_ProfilingOptions.m_FileFormat = fileFormat;
    options.m_ProfilingOptions.m_TimelineEnabled = timelineEnabled;

    if (timelineEnabled && !enableExternalProfiling)
    {
        ARMNN_LOG(fatal) << "Timeline profiling requires external profiling to be turned on";
        return EXIT_FAILURE;
    }

    // Check whether we have to load test cases from a file.
    if (CheckOption(vm, "test-cases"))
    {
        // Check that the file exists.
        if (!fs::exists(testCasesFile))
        {
            ARMNN_LOG(fatal) << "Given file \"" << testCasesFile << "\" does not exist";
            return EXIT_FAILURE;
        }

        // Parse CSV file and extract test cases
        armnnUtils::CsvReader reader;
        std::vector<armnnUtils::CsvRow> testCases = reader.ParseFile(testCasesFile);
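        // Each CSV row supplies the command-line arguments for one test case, e.g. (illustrative):
        //   -f tflite-binary -m model.tflite -i input -o output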

        // Check that there is at least one test case to run
        if (testCases.empty())
        {
            ARMNN_LOG(fatal) << "Given file \"" << testCasesFile << "\" has no test cases";
            return EXIT_FAILURE;
        }
        // Create runtime
        std::shared_ptr<armnn::IRuntime> runtime(armnn::IRuntime::Create(options));

        const std::string executableName("ExecuteNetwork");

        // Check whether we need to run the test cases concurrently
        if (concurrent)
        {
            std::vector<std::future<int>> results;
            results.reserve(testCases.size());

            // Run each test case in its own thread
            for (auto& testCase : testCases)
            {
                testCase.values.insert(testCase.values.begin(), executableName);
                results.push_back(std::async(std::launch::async, RunCsvTest, std::cref(testCase), std::cref(runtime),
                                             enableProfiling, enableFp16TurboMode, enableBf16TurboMode, thresholdTime,
                                             printIntermediate, enableLayerDetails, parseUnsupported,
                                             inferOutputShape));
            }

            // Check results
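            // (future::get() blocks until the corresponding test case has finished.)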
            for (auto& result : results)
            {
                if (result.get() != EXIT_SUCCESS)
                {
                    return EXIT_FAILURE;
                }
            }
        }
        else
        {
            // Run tests sequentially
            for (auto& testCase : testCases)
            {
                testCase.values.insert(testCase.values.begin(), executableName);
                if (RunCsvTest(testCase, runtime, enableProfiling,
                               enableFp16TurboMode, enableBf16TurboMode, thresholdTime, printIntermediate,
                               enableLayerDetails, parseUnsupported, inferOutputShape) != EXIT_SUCCESS)
                {
                    return EXIT_FAILURE;
                }
            }
        }

        return EXIT_SUCCESS;
    }
    else // Run single test
    {
        // Get the preferred order of compute devices. If none are specified, default to using CpuRef
        const std::string computeOption("compute");
        std::vector<std::string> computeDevicesAsStrings =
            CheckOption(vm, computeOption.c_str()) ?
                vm[computeOption].as<std::vector<std::string>>() :
                std::vector<std::string>();
        std::vector<armnn::BackendId> computeDevices(computeDevicesAsStrings.begin(), computeDevicesAsStrings.end());
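        // (armnn::BackendId is constructible from std::string, so the device names convert directly.)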

        // Remove duplicates from the list of compute devices.
        RemoveDuplicateDevices(computeDevices);

#if defined(ARMCOMPUTECL_ENABLED)
        std::shared_ptr<armnn::IGpuAccTunedParameters> tuned_params;

        if (tuningPath != "")
        {
            if (tuningLevel != 0)
            {
                RunCLTuning(tuningPath, tuningLevel, modelFormat, inputTensorShapes, computeDevices,
                            dynamicBackendsPath, modelPath, inputNames, inputTensorDataFilePaths, inputTypes,
                            quantizeInput, outputTypes, outputNames, outputTensorFiles, dequantizeOutput,
                            enableProfiling, enableFp16TurboMode, enableBf16TurboMode, thresholdTime,
                            printIntermediate, subgraphId, enableLayerDetails, parseUnsupported, inferOutputShape);
            }
            ARMNN_LOG(info) << "Using tuning params: " << tuningPath << "\n";
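            // TuningLevel 0 below means "no tuning run": the GpuAcc backend just consumes the
            // tuning file produced (or updated) by the RunCLTuning pass above.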
            options.m_BackendOptions.emplace_back(
                armnn::BackendOptions
                {
                    "GpuAcc",
                    {
                        {"TuningLevel", 0},
                        {"TuningFile", tuningPath.c_str()},
                        {"KernelProfilingEnabled", enableProfiling}
                    }
                }
            );
        }
#endif
        try
        {
            CheckOptionDependencies(vm);
        }
        catch (const po::error& e)
        {
            std::cerr << e.what() << std::endl << std::endl;
            std::cerr << desc << std::endl;
            return EXIT_FAILURE;
        }
        // Create runtime
        std::shared_ptr<armnn::IRuntime> runtime(armnn::IRuntime::Create(options));

        return RunTest(modelFormat, inputTensorShapes, computeDevices, dynamicBackendsPath, modelPath,
                       inputNames, inputTensorDataFilePaths, inputTypes, quantizeInput, outputTypes, outputNames,
                       outputTensorFiles, dequantizeOutput, enableProfiling, enableFp16TurboMode, enableBf16TurboMode,
                       thresholdTime, printIntermediate, subgraphId, enableLayerDetails, parseUnsupported,
                       inferOutputShape, iterations, runtime);
    }
}