// // Copyright © 2022 Arm Ltd and Contributors. All rights reserved. // SPDX-License-Identifier: MIT // #define LOG_TAG "arm-armnn-sl" #include "DriverOptions.hpp" #include "CanonicalUtils.hpp" #include #include #include "SystemPropertiesUtils.hpp" #include #include #include #include #include #include #include using namespace android; using namespace std; namespace armnn_driver { /* Builds options that target the single backend computeDevice. fp16Enabled is stored in m_fp16Enabled; every other member receives the fixed default listed in the initializer list (no exit requested, exit code EXIT_SUCCESS). */ DriverOptions::DriverOptions(armnn::Compute computeDevice, bool fp16Enabled) : m_Backends({computeDevice}) , m_VerboseLogging(false) , m_RequestInputsAndOutputsDumpDir(std::string("")) , m_ServiceName(std::string("armnn_sl")) , m_ForcedUnsupportedOperations({}) , m_ClTunedParametersMode(armnn::IGpuAccTunedParameters::Mode::UseTunedParameters) , m_ClTuningLevel(armnn::IGpuAccTunedParameters::TuningLevel::Rapid) , m_EnableGpuProfiling(false) , m_fp16Enabled(fp16Enabled) , m_FastMathEnabled(false) , m_ShouldExit(false) , m_ExitCode(EXIT_SUCCESS) , m_CachedNetworkFilePath(std::string("")) , m_SaveCachedNetwork(false) , m_NumberOfThreads(0) , m_EnableAsyncModelExecution(false) , m_ArmnnNumberOfThreads(1) { } /* Same member defaults as the single-device constructor, except that m_Backends is copied from the supplied backends list. */ DriverOptions::DriverOptions(const std::vector& backends, bool fp16Enabled) : m_Backends(backends) , m_VerboseLogging(false) , m_RequestInputsAndOutputsDumpDir(std::string("")) , m_ServiceName(std::string("armnn_sl")) , m_ForcedUnsupportedOperations({}) , m_ClTunedParametersMode(armnn::IGpuAccTunedParameters::Mode::UseTunedParameters) , m_ClTuningLevel(armnn::IGpuAccTunedParameters::TuningLevel::Rapid) , m_EnableGpuProfiling(false) , m_fp16Enabled(fp16Enabled) , m_FastMathEnabled(false) , m_ShouldExit(false) , m_ExitCode(EXIT_SUCCESS) , m_CachedNetworkFilePath(std::string("")) , m_SaveCachedNetwork(false) , m_NumberOfThreads(0) , m_EnableAsyncModelExecution(false) , m_ArmnnNumberOfThreads(1) { } // This default constructor will examine an environment variable called // ARMNN_SL_OPTIONS. It will parse the parameters using the existing cxx // opts mechanism. 
DriverOptions::DriverOptions() : m_VerboseLogging(false) , m_RequestInputsAndOutputsDumpDir(std::string("")) , m_ServiceName(std::string("armnn_sl")) , m_ForcedUnsupportedOperations({}) , m_ClTunedParametersMode(armnn::IGpuAccTunedParameters::Mode::UseTunedParameters) , m_ClTuningLevel(armnn::IGpuAccTunedParameters::TuningLevel::Rapid) , m_EnableGpuProfiling(false) , m_fp16Enabled(false) , m_FastMathEnabled(false) , m_ShouldExit(false) , m_SaveCachedNetwork(false) , m_NumberOfThreads(0) , m_EnableAsyncModelExecution(false) , m_ArmnnNumberOfThreads(1) { std::string unsupportedOperationsAsString; std::string clTunedParametersModeAsString; std::string clTuningLevelAsString; std::vector backends; bool showHelp = false; bool showVersion = false; const char* rawEnv = std::getenv("ARMNN_SL_OPTIONS"); // If the environment variable isn't set we'll continue as if it were an empty string. if (!rawEnv) { rawEnv = ""; } string optionsAsString(rawEnv); regex whiteSpaceRegex("\\s+"); // Tokienize the string based on whitespace. sregex_token_iterator iter(optionsAsString.begin(), optionsAsString.end(), whiteSpaceRegex, -1); sregex_token_iterator end; vector cliAsVector(iter, end); // As we're pretending to be a command line, argv[0] should be an executable name. cliAsVector.insert(cliAsVector.begin(), "ARMNN_SL_OPTIONS"); // Convert the vector of string to a vector of char* backed by the existing vector. std::vector argVector; for (const auto& arg : cliAsVector) { argVector.push_back((char*)arg.data()); } // Terminate the array. argVector.push_back(nullptr); // Create usable variables. int argc = argVector.size() - 1; // Ignore the null pointer at the end. char** argv = argVector.data(); cxxopts::Options optionsDesc(argv[0], "Arm NN Support Library for the Android Neural Networks API." 
"The support library will convert Android NNAPI requests " "and delegate them to available ArmNN backends."); try { optionsDesc.add_options() ("a,enable-fast-math", "Enables fast_math options in backends that support it. Using the fast_math flag can " "lead to performance improvements but may result in reduced or different precision.", cxxopts::value(m_FastMathEnabled)->default_value("false")) ("c,compute","Comma separated list of backends to run layers on. " "Examples of possible values are: CpuRef, CpuAcc, GpuAcc", cxxopts::value>(backends)) ("d,request-inputs-and-outputs-dump-dir", "If non-empty, the directory where request inputs and outputs should be dumped", cxxopts::value(m_RequestInputsAndOutputsDumpDir)->default_value("")) ("f,fp16-enabled", "Enables support for relaxed computation from Float32 to Float16", cxxopts::value(m_fp16Enabled)->default_value("false")) ("h,help", "Show this help", cxxopts::value(showHelp)->default_value("false")->implicit_value("true")) ("m,cl-tuned-parameters-mode", "If 'UseTunedParameters' (the default), will read CL tuned parameters from the file specified by " "--cl-tuned-parameters-file. " "If 'UpdateTunedParameters', will also find the optimum parameters when preparing new networks and update " "the file accordingly.", cxxopts::value(clTunedParametersModeAsString)->default_value("UseTunedParameters")) ("g,mlgo-cl-tuned-parameters-file", "If non-empty, the given file will be used to load/save MLGO CL tuned parameters. 
", cxxopts::value(m_ClMLGOTunedParametersFile)->default_value("")) ("o,cl-tuning-level", "exhaustive: all lws values are tested " "normal: reduced number of lws values but enough to still have the performance really close to the " "exhaustive approach " "rapid: only 3 lws values should be tested for each kernel ", cxxopts::value(clTuningLevelAsString)->default_value("rapid")) ("p,gpu-profiling", "Turns GPU profiling on", cxxopts::value(m_EnableGpuProfiling)->default_value("false")) ("q,cached-network-file", "If non-empty, the given file will be used to load/save cached network. " "If save-cached-network option is given will save the cached network to given file." "If save-cached-network option is not given will load the cached network from given " "file.", cxxopts::value(m_CachedNetworkFilePath)->default_value("")) ("s,save-cached-network", "Enables saving the cached network to the file given with cached-network-file option." " See also --cached-network-file", cxxopts::value(m_SaveCachedNetwork)->default_value("false")) ("number-of-threads", "Assign the number of threads used by the CpuAcc backend. " "Input value must be between 1 and 64. " "Default is set to 0 (Backend will decide number of threads to use).", cxxopts::value(m_NumberOfThreads)->default_value("0")) ("t,cl-tuned-parameters-file", "If non-empty, the given file will be used to load/save CL tuned parameters. 
" "See also --cl-tuned-parameters-mode", cxxopts::value(m_ClTunedParametersFile)->default_value("")) ("u,unsupported-operations", "If non-empty, a comma-separated list of operation indices which the driver will forcibly " "consider unsupported", cxxopts::value(unsupportedOperationsAsString)->default_value("")) ("v,verbose-logging", "Turns verbose logging on", cxxopts::value(m_VerboseLogging)->default_value("false")->implicit_value("true")) ("V,version", "Show version information", cxxopts::value(showVersion)->default_value("false")->implicit_value("true")) ; } catch (const std::exception& e) { VLOG(DRIVER) << "An error occurred attempting to construct options: " << e.what(); std::cout << "An error occurred attempting to construct options: %s" << std::endl; m_ExitCode = EXIT_FAILURE; return; } try { cxxopts::ParseResult result = optionsDesc.parse(argc, argv); } catch (const cxxopts::OptionException& e) { VLOG(DRIVER) << "An exception occurred attempting to parse program options: " << e.what(); std::cout << optionsDesc.help() << std::endl << "An exception occurred while parsing program options: " << std::endl << e.what() << std::endl; m_ShouldExit = true; m_ExitCode = EXIT_FAILURE; return; } if (showHelp) { VLOG(DRIVER) << "Showing help and exiting"; std::cout << optionsDesc.help() << std::endl; m_ShouldExit = true; m_ExitCode = EXIT_SUCCESS; return; } if (showVersion) { VLOG(DRIVER) << "Showing version and exiting"; std::cout << "ArmNN Android NN driver for the Android Neural Networks API.\n" "ArmNN v" << ARMNN_VERSION << std::endl; m_ShouldExit = true; m_ExitCode = EXIT_SUCCESS; return; } // Convert the string backend names into backendId's. m_Backends.reserve(backends.size()); for (auto&& backend : backends) { m_Backends.emplace_back(backend); } // If no backends have been specified then the default value is GpuAcc. 
if (backends.empty()) { VLOG(DRIVER) << "No backends have been specified:"; std::cout << optionsDesc.help() << std::endl << "Unable to start:" << std::endl << "No backends have been specified" << std::endl; m_ShouldExit = true; m_ExitCode = EXIT_FAILURE; return; } if (!unsupportedOperationsAsString.empty()) { std::istringstream argStream(unsupportedOperationsAsString); std::string s; while (!argStream.eof()) { std::getline(argStream, s, ','); try { unsigned int operationIdx = std::stoi(s); m_ForcedUnsupportedOperations.insert(operationIdx); } catch (const std::invalid_argument&) { VLOG(DRIVER) << "Ignoring invalid integer argument in -u/--unsupported-operations value: " << s.c_str(); } } } if (!m_ClTunedParametersFile.empty()) { // The mode is only relevant if the file path has been provided if (clTunedParametersModeAsString == "UseTunedParameters") { m_ClTunedParametersMode = armnn::IGpuAccTunedParameters::Mode::UseTunedParameters; } else if (clTunedParametersModeAsString == "UpdateTunedParameters") { m_ClTunedParametersMode = armnn::IGpuAccTunedParameters::Mode::UpdateTunedParameters; } else { VLOG(DRIVER) << "Requested unknown cl-tuned-parameters-mode " << clTunedParametersModeAsString.c_str() << ". Defaulting to UseTunedParameters"; } if (clTuningLevelAsString == "exhaustive") { m_ClTuningLevel = armnn::IGpuAccTunedParameters::TuningLevel::Exhaustive; } else if (clTuningLevelAsString == "normal") { m_ClTuningLevel = armnn::IGpuAccTunedParameters::TuningLevel::Normal; } else if (clTuningLevelAsString == "rapid") { m_ClTuningLevel = armnn::IGpuAccTunedParameters::TuningLevel::Rapid; } else { VLOG(DRIVER) << "Requested unknown cl-tuner-mode '%s'. " "Defaulting to rapid" << clTuningLevelAsString.c_str(); } } } } // namespace armnn_driver