// openvino/inference-engine/samples/benchmark_app/main.cpp
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
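//
// benchmark_app measures inference performance (latency and throughput) of a
// network on the selected device. A typical invocation, using only flags that
// appear in this file (run with -h for the authoritative list), might look like:
//   ./benchmark_app -m model.xml -d CPU -api async -t 60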
#include <algorithm>
#include <chrono>
#include <gna/gna_config.hpp>
#include <gpu/gpu_config.hpp>
#include <inference_engine.hpp>
#include <iomanip>
#include <iostream>
#include <map>
#include <memory>
#include <samples/args_helper.hpp>
#include <samples/common.hpp>
#include <samples/slog.hpp>
#include <set>
#include <sstream>
#include <string>
#include <utility>
#include <vector>
#include <vpu/vpu_plugin_config.hpp>
#include "benchmark_app.hpp"
#include "infer_request_wrap.hpp"
#include "inputs_filling.hpp"
#include "progress_bar.hpp"
#include "remote_blobs_filling.hpp"
#include "statistics_report.hpp"
#include "utils.hpp"
using namespace InferenceEngine;
static const size_t progressBarDefaultTotalCount = 1000;
uint64_t getDurationInMilliseconds(uint32_t duration) {
return duration * 1000LL;
}
2018-11-23 16:19:43 +03:00
uint64_t getDurationInNanoseconds(uint32_t duration) {
return duration * 1000000000LL;
}
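
// NB: in both helpers above, the LL literals widen the multiplication to
// 64 bits, so a duration given in seconds cannot overflow uint32_t math.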
2018-11-23 16:19:43 +03:00
bool ParseAndCheckCommandLine(int argc, char* argv[]) {
// ---------------------------Parsing and validating input
// arguments--------------------------------------
slog::info << "Parsing input parameters" << slog::endl;
gflags::ParseCommandLineNonHelpFlags(&argc, &argv, true);
if (FLAGS_help || FLAGS_h) {
showUsage();
showAvailableDevices();
return false;
}
if (FLAGS_m.empty()) {
showUsage();
throw std::logic_error("Model is required but not set. Please set -m option.");
}
if (FLAGS_latency_percentile > 100 || FLAGS_latency_percentile < 1) {
showUsage();
throw std::logic_error("The percentile value is incorrect. The applicable values range is [1, 100].");
}
if (FLAGS_api != "async" && FLAGS_api != "sync") {
throw std::logic_error("Incorrect API. Please set -api option to `sync` or `async` value.");
}
if (!FLAGS_hint.empty() && FLAGS_hint != "throughput" && FLAGS_hint != "tput" && FLAGS_hint != "latency") {
throw std::logic_error("Incorrect performance hint. Please set -hint option to "
"either `throughput` (tput) or `latency` value.");
}
if (!FLAGS_report_type.empty() && FLAGS_report_type != noCntReport && FLAGS_report_type != averageCntReport &&
FLAGS_report_type != detailedCntReport) {
std::string err = "only " + std::string(noCntReport) + "/" + std::string(averageCntReport) + "/" +
std::string(detailedCntReport) +
" report types are supported (invalid -report_type option value)";
throw std::logic_error(err);
}
if ((FLAGS_report_type == averageCntReport) && ((FLAGS_d.find("MULTI") != std::string::npos))) {
throw std::logic_error("only " + std::string(detailedCntReport) + " report type is supported for MULTI device");
}
bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
bool isPrecisionSet = !(FLAGS_ip.empty() && FLAGS_op.empty() && FLAGS_iop.empty());
if (isNetworkCompiled && isPrecisionSet) {
std::string err = std::string("Cannot set precision for a compiled network. ") +
std::string("Please re-compile your network with required precision "
"using compile_tool");
throw std::logic_error(err);
}
return true;
}
static void next_step(const std::string additional_info = "") {
static size_t step_id = 0;
static const std::map<size_t, std::string> step_names = {
{1, "Parsing and validating input arguments"},
{2, "Loading Inference Engine"},
{3, "Setting device configuration"},
{4, "Reading network files"},
{5, "Resizing network to match image sizes and given batch"},
{6, "Configuring input of the model"},
{7, "Loading the model to the device"},
{8, "Setting optimal runtime parameters"},
{9, "Creating infer requests and filling input blobs with images"},
{10, "Measuring performance"},
{11, "Dumping statistics report"}};
step_id++;
if (step_names.count(step_id) == 0)
IE_THROW() << "Step ID " << step_id << " is out of total steps number " << step_names.size();
std::cout << "[Step " << step_id << "/" << step_names.size() << "] " << step_names.at(step_id)
<< (additional_info.empty() ? "" : " (" + additional_info + ")") << std::endl;
}
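
// NB: every step calls next_step() exactly once, even when its work is
// skipped (see the "Skipping the step..." branches below), so the printed
// step counter stays aligned with the map above.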
template <typename T>
T getMedianValue(const std::vector<T>& vec, std::size_t percentile) {
std::vector<T> sortedVec(vec);
std::sort(sortedVec.begin(), sortedVec.end());
// Multiply before dividing so that vectors shorter than 100 elements do not
// always collapse to index 0, and clamp so percentile == 100 stays in bounds.
return sortedVec[std::min(sortedVec.size() - 1, sortedVec.size() * percentile / 100)];
}
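
// e.g. with 1000 collected latencies and -latency_percentile 90, the value
// at sorted index 1000 * 90 / 100 = 900 is reported.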
/**
* @brief The entry point of the benchmark application
*/
int main(int argc, char* argv[]) {
std::shared_ptr<StatisticsReport> statistics;
2019-04-12 18:25:53 +03:00
try {
ExecutableNetwork exeNetwork;
// ----------------- 1. Parsing and validating input arguments
// -------------------------------------------------
next_step();
if (!ParseAndCheckCommandLine(argc, argv)) {
return 0;
}
bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
if (isNetworkCompiled) {
slog::info << "Network is compiled" << slog::endl;
}
std::vector<gflags::CommandLineFlagInfo> flags;
StatisticsReport::Parameters command_line_arguments;
gflags::GetAllFlags(&flags);
for (auto& flag : flags) {
if (!flag.is_default) {
command_line_arguments.push_back({flag.name, flag.current_value});
}
}
if (!FLAGS_report_type.empty()) {
statistics =
std::make_shared<StatisticsReport>(StatisticsReport::Config{FLAGS_report_type, FLAGS_report_folder});
statistics->addParameters(StatisticsReport::Category::COMMAND_LINE_PARAMETERS, command_line_arguments);
}
auto isFlagSetInCommandLine = [&command_line_arguments](const std::string& name) {
return (std::find_if(command_line_arguments.begin(),
command_line_arguments.end(),
[name](const std::pair<std::string, std::string>& p) {
return p.first == name;
}) != command_line_arguments.end());
};
std::string device_name = FLAGS_d;
// Parse devices
auto devices = parseDevices(device_name);
// Parse nstreams per device
std::map<std::string, std::string> device_nstreams = parseNStreamsValuePerDevice(devices, FLAGS_nstreams);
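// e.g. -nstreams CPU:4,GPU:2 yields {"CPU": "4", "GPU": "2"}; the expected
// format <dev1>:<nstreams1>,<dev2>:<nstreams2> matches the error message
// further below.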
// Load device config file if specified
std::map<std::string, std::map<std::string, std::string>> config;
#ifdef USE_OPENCV
if (!FLAGS_load_config.empty()) {
load_config(FLAGS_load_config, config);
}
#endif
/** This vector stores paths to the processed images **/
std::vector<std::string> inputFiles;
parseInputFilesArguments(inputFiles);
// ----------------- 2. Loading the Inference Engine
// -----------------------------------------------------------
next_step();
Core ie;
if (FLAGS_d.find("CPU") != std::string::npos && !FLAGS_l.empty()) {
// CPU (MKLDNN) extensions is loaded as a shared library and passed as a
// pointer to base extension
2021-03-05 12:08:01 +03:00
const auto extension_ptr = std::make_shared<InferenceEngine::Extension>(FLAGS_l);
ie.AddExtension(extension_ptr);
2020-02-11 22:48:49 +03:00
slog::info << "CPU (MKLDNN) extensions is loaded " << FLAGS_l << slog::endl;
}
// Load clDNN Extensions
if ((FLAGS_d.find("GPU") != std::string::npos) && !FLAGS_c.empty()) {
// Override config if command line parameter is specified
if (!config.count("GPU"))
config["GPU"] = {};
config["GPU"][CONFIG_KEY(CONFIG_FILE)] = FLAGS_c;
}
if (config.count("GPU") && config.at("GPU").count(CONFIG_KEY(CONFIG_FILE))) {
auto ext = config.at("GPU").at(CONFIG_KEY(CONFIG_FILE));
ie.SetConfig({{CONFIG_KEY(CONFIG_FILE), ext}}, "GPU");
slog::info << "GPU extensions is loaded " << ext << slog::endl;
2018-11-23 16:19:43 +03:00
}
slog::info << "InferenceEngine: " << GetInferenceEngineVersion() << slog::endl;
slog::info << "Device info: " << slog::endl;
std::cout << ie.GetVersions(device_name) << std::endl;
// ----------------- 3. Setting device configuration
// -----------------------------------------------------------
next_step();
std::string ov_perf_hint;
if (FLAGS_hint == "throughput" || FLAGS_hint == "tput")
ov_perf_hint = CONFIG_VALUE(THROUGHPUT);
else if (FLAGS_hint == "latency")
ov_perf_hint = CONFIG_VALUE(LATENCY);
auto getDeviceTypeFromName = [](std::string device) -> std::string {
return device.substr(0, device.find_first_of(".("));
};
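// e.g. "GPU.1" -> "GPU", so defaults dumped for a device type can be applied
// to a particular enumerated device below.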
// Set default values from dumped config
std::set<std::string> default_devices;
for (auto& device : devices) {
auto default_config = config.find(getDeviceTypeFromName(device));
if (default_config != config.end()) {
if (!config.count(device)) {
config[device] = default_config->second;
default_devices.emplace(default_config->first);
}
}
}
for (auto& device : default_devices) {
config.erase(device);
}
bool perf_counts = false;
// Update config per device according to command line parameters
for (auto& device : devices) {
if (!config.count(device))
config[device] = {};
std::map<std::string, std::string>& device_config = config.at(device);
// high-level performance modes
if (!ov_perf_hint.empty()) {
device_config[CONFIG_KEY(PERFORMANCE_HINT)] = ov_perf_hint;
if (FLAGS_nireq != 0)
device_config[CONFIG_KEY(PERFORMANCE_HINT_NUM_REQUESTS)] = std::to_string(FLAGS_nireq);
}
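// e.g. -hint throughput -nireq 4 results in PERFORMANCE_HINT=THROUGHPUT and
// PERFORMANCE_HINT_NUM_REQUESTS=4 in this device's config.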
// Set performance counter
if (isFlagSetInCommandLine("pc")) {
// set to user defined value
device_config[CONFIG_KEY(PERF_COUNT)] = FLAGS_pc ? CONFIG_VALUE(YES) : CONFIG_VALUE(NO);
} else if (device_config.count(CONFIG_KEY(PERF_COUNT)) &&
(device_config.at(CONFIG_KEY(PERF_COUNT)) == "YES")) {
slog::warn << "Performance counters for " << device
<< " device is turned on. To print results use -pc option." << slog::endl;
} else if (FLAGS_report_type == detailedCntReport || FLAGS_report_type == averageCntReport) {
slog::warn << "Turn on performance counters for " << device << " device since report type is "
<< FLAGS_report_type << "." << slog::endl;
device_config[CONFIG_KEY(PERF_COUNT)] = CONFIG_VALUE(YES);
} else if (!FLAGS_exec_graph_path.empty()) {
slog::warn << "Turn on performance counters for " << device << " device due to execution graph dumping."
<< slog::endl;
device_config[CONFIG_KEY(PERF_COUNT)] = CONFIG_VALUE(YES);
} else {
// set to default value
device_config[CONFIG_KEY(PERF_COUNT)] = FLAGS_pc ? CONFIG_VALUE(YES) : CONFIG_VALUE(NO);
}
perf_counts = (device_config.at(CONFIG_KEY(PERF_COUNT)) == CONFIG_VALUE(YES)) ? true : perf_counts;
// the rest are individual per-device settings (overriding the values set with perf modes)
auto setThroughputStreams = [&]() {
const std::string key = getDeviceTypeFromName(device) + "_THROUGHPUT_STREAMS";
if (device_nstreams.count(device)) {
// set to user defined value
std::vector<std::string> supported_config_keys =
ie.GetMetric(device, METRIC_KEY(SUPPORTED_CONFIG_KEYS));
if (std::find(supported_config_keys.begin(), supported_config_keys.end(), key) ==
supported_config_keys.end()) {
throw std::logic_error("Device " + device + " doesn't support config key '" + key + "'! " +
"Please specify -nstreams for correct devices in format "
"<dev1>:<nstreams1>,<dev2>:<nstreams2>" +
" or via configuration file.");
}
device_config[key] = device_nstreams.at(device);
} else if (ov_perf_hint.empty() && !device_config.count(key) && (FLAGS_api == "async")) {
slog::warn << "-nstreams default value is determined automatically for " << device
<< " device. "
"Although the automatic selection usually provides a "
"reasonable performance, "
"but it still may be non-optimal for some cases, for more "
"information look at README."
<< slog::endl;
if (std::string::npos == device.find("MYRIAD")) // MYRIAD sets the default number of
// streams implicitly (without _AUTO)
device_config[key] = std::string(getDeviceTypeFromName(device) + "_THROUGHPUT_AUTO");
}
if (device_config.count(key))
device_nstreams[device] = device_config.at(key);
};
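// e.g. for "CPU" the key is "CPU_THROUGHPUT_STREAMS"; without an explicit
// -nstreams (async API, no hint) it falls back to "CPU_THROUGHPUT_AUTO".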
if (device.find("CPU") != std::string::npos) { // CPU supports few special performance-oriented keys
// limit threading for CPU portion of inference
if (isFlagSetInCommandLine("nthreads"))
device_config[CONFIG_KEY(CPU_THREADS_NUM)] = std::to_string(FLAGS_nthreads);
if (isFlagSetInCommandLine("enforcebf16"))
device_config[CONFIG_KEY(ENFORCE_BF16)] = FLAGS_enforcebf16 ? CONFIG_VALUE(YES) : CONFIG_VALUE(NO);
if (isFlagSetInCommandLine("pin")) {
// set to user defined value
device_config[CONFIG_KEY(CPU_BIND_THREAD)] = FLAGS_pin;
} else if (!device_config.count(CONFIG_KEY(CPU_BIND_THREAD))) {
if ((device_name.find("MULTI") != std::string::npos) &&
(device_name.find("GPU") != std::string::npos)) {
slog::warn << "Turn off threads pinning for " << device
<< " device since multi-scenario with GPU device is used." << slog::endl;
device_config[CONFIG_KEY(CPU_BIND_THREAD)] = CONFIG_VALUE(NO);
}
}
// for CPU execution, more throughput-oriented execution via streams
setThroughputStreams();
} else if (device.find("GPU") != std::string::npos) {
// for GPU execution, more throughput-oriented execution via streams
setThroughputStreams();
if ((device_name.find("MULTI") != std::string::npos) &&
(device_name.find("CPU") != std::string::npos)) {
slog::warn << "Turn on GPU throttling. Multi-device execution with "
"the CPU + GPU performs best with GPU throttling hint, "
<< "which releases another CPU thread (that is otherwise "
"used by the GPU driver for active polling)"
<< slog::endl;
device_config[GPU_CONFIG_KEY(PLUGIN_THROTTLE)] = "1";
}
} else if (device.find("MYRIAD") != std::string::npos) {
device_config[CONFIG_KEY(LOG_LEVEL)] = CONFIG_VALUE(LOG_WARNING);
setThroughputStreams();
} else if (device.find("GNA") != std::string::npos) {
if (FLAGS_qb == 8)
device_config[GNA_CONFIG_KEY(PRECISION)] = "I8";
else
device_config[GNA_CONFIG_KEY(PRECISION)] = "I16";
if (isFlagSetInCommandLine("nthreads"))
device_config[GNA_CONFIG_KEY(LIB_N_THREADS)] = std::to_string(FLAGS_nthreads);
} else {
std::vector<std::string> supported_config_keys =
ie.GetMetric(device, METRIC_KEY(SUPPORTED_CONFIG_KEYS));
auto supported = [&](const std::string& key) {
return std::find(std::begin(supported_config_keys), std::end(supported_config_keys), key) !=
std::end(supported_config_keys);
};
if (supported(CONFIG_KEY(CPU_THREADS_NUM)) && isFlagSetInCommandLine("nthreads")) {
device_config[CONFIG_KEY(CPU_THREADS_NUM)] = std::to_string(FLAGS_nthreads);
}
if (supported(CONFIG_KEY(CPU_THROUGHPUT_STREAMS)) && isFlagSetInCommandLine("nstreams")) {
device_config[CONFIG_KEY(CPU_THROUGHPUT_STREAMS)] = FLAGS_nstreams;
}
if (supported(CONFIG_KEY(CPU_BIND_THREAD)) && isFlagSetInCommandLine("pin")) {
device_config[CONFIG_KEY(CPU_BIND_THREAD)] = FLAGS_pin;
}
}
}
for (auto&& item : config) {
ie.SetConfig(item.second, item.first);
}
auto double_to_string = [](const double number) {
std::stringstream ss;
ss << std::fixed << std::setprecision(2) << number;
return ss.str();
};
auto get_total_ms_time = [](Time::time_point& startTime) {
return std::chrono::duration_cast<ns>(Time::now() - startTime).count() * 0.000001;
};
size_t batchSize = FLAGS_b;
Precision precision = Precision::UNSPECIFIED;
std::string topology_name = "";
benchmark_app::InputsInfo app_inputs_info;
std::string output_name;
// Takes priority over config from file
if (!FLAGS_cache_dir.empty()) {
ie.SetConfig({{CONFIG_KEY(CACHE_DIR), FLAGS_cache_dir}});
}
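// -cache_dir enables model caching: the first run exports the compiled model
// into that directory and later runs import it, which typically shortens the
// "load network" step measured below.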
if (FLAGS_load_from_file && !isNetworkCompiled) {
next_step();
slog::info << "Skipping the step for loading network from file" << slog::endl;
next_step();
slog::info << "Skipping the step for loading network from file" << slog::endl;
next_step();
slog::info << "Skipping the step for loading network from file" << slog::endl;
auto startTime = Time::now();
exeNetwork = ie.LoadNetwork(FLAGS_m, device_name);
auto duration_ms = double_to_string(get_total_ms_time(startTime));
slog::info << "Load network took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"load network time (ms)", duration_ms}});
app_inputs_info = getInputsInfo<InputInfo::CPtr>(FLAGS_shape,
FLAGS_layout,
FLAGS_b,
FLAGS_iscale,
FLAGS_imean,
exeNetwork.GetInputsInfo());
if (batchSize == 0) {
batchSize = 1;
}
} else if (!isNetworkCompiled) {
// ----------------- 4. Reading the Intermediate Representation network
// ----------------------------------------
next_step();
slog::info << "Loading network files" << slog::endl;
auto startTime = Time::now();
CNNNetwork cnnNetwork = ie.ReadNetwork(FLAGS_m);
auto duration_ms = double_to_string(get_total_ms_time(startTime));
slog::info << "Read network took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"read network time (ms)", duration_ms}});
const InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
if (inputInfo.empty()) {
throw std::logic_error("no inputs info is provided");
}
// ----------------- 5. Resizing network to match image sizes and given
// batch ----------------------------------
next_step();
batchSize = cnnNetwork.getBatchSize();
// Parse input shapes if specified
bool reshape = false;
app_inputs_info = getInputsInfo<InputInfo::Ptr>(FLAGS_shape,
FLAGS_layout,
FLAGS_b,
FLAGS_iscale,
FLAGS_imean,
inputInfo,
reshape);
if (reshape) {
InferenceEngine::ICNNNetwork::InputShapes shapes = {};
for (auto& item : app_inputs_info)
shapes[item.first] = item.second.shape;
slog::info << "Reshaping network: " << getShapesString(shapes) << slog::endl;
startTime = Time::now();
cnnNetwork.reshape(shapes);
duration_ms = double_to_string(get_total_ms_time(startTime));
slog::info << "Reshape network took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"reshape network time (ms)", duration_ms}});
}
// use batch size according to provided layout and shapes
batchSize = (!FLAGS_layout.empty()) ? getBatchSize(app_inputs_info) : cnnNetwork.getBatchSize();
topology_name = cnnNetwork.getName();
slog::info << (FLAGS_b != 0 ? "Network batch size was changed to: " : "Network batch size: ") << batchSize
<< slog::endl;
// ----------------- 6. Configuring inputs and outputs
// ----------------------------------------------------------------------
next_step();
processPrecision(cnnNetwork, FLAGS_ip, FLAGS_op, FLAGS_iop);
for (auto& item : cnnNetwork.getInputsInfo()) {
// if the input precision was set by the user, propagate it to app_inputs_info;
// otherwise, if the input is an image, set U8
if (!FLAGS_ip.empty() || FLAGS_iop.find(item.first) != std::string::npos) {
app_inputs_info.at(item.first).precision = item.second->getPrecision();
} else if (app_inputs_info.at(item.first).isImage()) {
app_inputs_info.at(item.first).precision = Precision::U8;
item.second->setPrecision(app_inputs_info.at(item.first).precision);
}
}
printInputAndOutputsInfo(cnnNetwork);
// ----------------- 7. Loading the model to the device
// --------------------------------------------------------
next_step();
startTime = Time::now();
exeNetwork = ie.LoadNetwork(cnnNetwork, device_name);
duration_ms = double_to_string(get_total_ms_time(startTime));
slog::info << "Load network took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"load network time (ms)", duration_ms}});
} else {
next_step();
slog::info << "Skipping the step for compiled network" << slog::endl;
next_step();
slog::info << "Skipping the step for compiled network" << slog::endl;
next_step();
slog::info << "Skipping the step for compiled network" << slog::endl;
// ----------------- 7. Loading the model to the device
// --------------------------------------------------------
next_step();
auto startTime = Time::now();
exeNetwork = ie.ImportNetwork(FLAGS_m, device_name, {});
auto duration_ms = double_to_string(get_total_ms_time(startTime));
slog::info << "Import network took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"import network time (ms)", duration_ms}});
app_inputs_info = getInputsInfo<InputInfo::CPtr>(FLAGS_shape,
FLAGS_layout,
FLAGS_b,
FLAGS_iscale,
FLAGS_imean,
exeNetwork.GetInputsInfo());
if (batchSize == 0) {
batchSize = 1;
}
}
// ----------------- 8. Querying optimal runtime parameters
// -----------------------------------------------------
next_step();
// output of the actual settings that the device selected based on the hint
if (!ov_perf_hint.empty()) {
for (const auto& device : devices) {
std::vector<std::string> supported_config_keys =
ie.GetMetric(device, METRIC_KEY(SUPPORTED_CONFIG_KEYS));
slog::info << "Device: " << device << slog::endl;
for (const auto& cfg : supported_config_keys) {
try {
slog::info << " {" << cfg << " , " << exeNetwork.GetConfig(cfg).as<std::string>();
} catch (...) {
// the key may be unsupported by the compiled network; skip its value
}
slog::info << " }" << slog::endl;
}
}
}
// Update number of streams
for (auto&& ds : device_nstreams) {
const std::string key = getDeviceTypeFromName(ds.first) + "_THROUGHPUT_STREAMS";
device_nstreams[ds.first] = ie.GetConfig(ds.first, key).as<std::string>();
}
// Number of requests
uint32_t nireq = FLAGS_nireq;
if (nireq == 0) {
if (FLAGS_api == "sync") {
nireq = 1;
} else {
std::string key = METRIC_KEY(OPTIMAL_NUMBER_OF_INFER_REQUESTS);
try {
nireq = exeNetwork.GetMetric(key).as<unsigned int>();
} catch (const std::exception& ex) {
IE_THROW() << "Every device used with the benchmark_app should "
<< "support OPTIMAL_NUMBER_OF_INFER_REQUESTS "
"ExecutableNetwork metric. "
<< "Failed to query the metric for the " << device_name << " with error:" << ex.what();
}
}
}
// Iteration limit
uint32_t niter = FLAGS_niter;
if ((niter > 0) && (FLAGS_api == "async")) {
niter = ((niter + nireq - 1) / nireq) * nireq;
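// e.g. -niter 10 with nireq = 4 rounds up to ((10 + 3) / 4) * 4 = 12, so
// every request runs a whole number of times.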
if (FLAGS_niter != niter) {
slog::warn << "Number of iterations was aligned by request number from " << FLAGS_niter << " to "
<< niter << " using number of requests " << nireq << slog::endl;
}
}
// Time limit
uint32_t duration_seconds = 0;
if (FLAGS_t != 0) {
// time limit
duration_seconds = FLAGS_t;
} else if (FLAGS_niter == 0) {
// default time limit
duration_seconds = deviceDefaultDeviceDurationInSeconds(device_name);
}
uint64_t duration_nanoseconds = getDurationInNanoseconds(duration_seconds);
if (statistics) {
statistics->addParameters(
StatisticsReport::Category::RUNTIME_CONFIG,
{
{"topology", topology_name},
{"target device", device_name},
{"API", FLAGS_api},
{"precision", std::string(precision.name())},
{"batch size", std::to_string(batchSize)},
{"number of iterations", std::to_string(niter)},
{"number of parallel infer requests", std::to_string(nireq)},
{"duration (ms)", std::to_string(getDurationInMilliseconds(duration_seconds))},
});
for (auto& nstreams : device_nstreams) {
std::stringstream ss;
ss << "number of " << nstreams.first << " streams";
statistics->addParameters(StatisticsReport::Category::RUNTIME_CONFIG,
{
{ss.str(), nstreams.second},
});
}
}
// ----------------- 9. Creating infer requests and filling input blobs
// ----------------------------------------
next_step();
InferRequestsQueue inferRequestsQueue(exeNetwork, nireq);
if (isFlagSetInCommandLine("use_device_mem")) {
if (device_name.find("GPU") == 0)
::gpu::fillRemoteBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests, exeNetwork);
else if (device_name.find("CPU") == 0)
fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
else
IE_THROW() << "Requested device doesn't support `use_device_mem` option.";
} else {
fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
}
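// With -use_device_mem the inputs live in device-side (remote) blobs, which
// is presumably meant to keep host<->device copies out of the measured loop.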
// ----------------- 10. Measuring performance
// ------------------------------------------------------------------
size_t progressCnt = 0;
size_t progressBarTotalCount = progressBarDefaultTotalCount;
size_t iteration = 0;
std::stringstream ss;
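// FLAGS_api is either "sync" or "async", so appending "hronously" prints
// "Start inference synchronously" / "Start inference asynchronously"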
ss << "Start inference " << FLAGS_api << "hronously";
if (FLAGS_api == "async") {
if (!ss.str().empty()) {
ss << ", ";
}
ss << nireq << " inference requests";
std::stringstream device_ss;
for (auto& nstreams : device_nstreams) {
if (!device_ss.str().empty()) {
device_ss << ", ";
}
device_ss << nstreams.second << " streams for " << nstreams.first;
}
if (!device_ss.str().empty()) {
ss << " using " << device_ss.str();
}
}
ss << ", limits: ";
if (duration_seconds > 0) {
ss << getDurationInMilliseconds(duration_seconds) << " ms duration";
}
if (niter != 0) {
if (duration_seconds == 0) {
progressBarTotalCount = niter;
}
if (duration_seconds > 0) {
ss << ", ";
}
ss << niter << " iterations";
}
next_step(ss.str());
// warming up - out of scope
auto inferRequest = inferRequestsQueue.getIdleRequest();
if (!inferRequest) {
IE_THROW() << "No idle Infer Requests!";
}
if (FLAGS_api == "sync") {
inferRequest->infer();
} else {
inferRequest->startAsync();
}
inferRequestsQueue.waitAll();
auto duration_ms = double_to_string(inferRequestsQueue.getLatencies()[0]);
slog::info << "First inference took " << duration_ms << " ms" << slog::endl;
if (statistics)
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"first inference time (ms)", duration_ms}});
inferRequestsQueue.resetTimes();
auto startTime = Time::now();
auto execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();
/** Start inference & calculate performance **/
/** to align the number of iterations to guarantee that the last infer requests
* are executed in the same conditions **/
ProgressBar progressBar(progressBarTotalCount, FLAGS_stream_output, FLAGS_progress);
while ((niter != 0LL && iteration < niter) ||
(duration_nanoseconds != 0LL && (uint64_t)execTime < duration_nanoseconds) ||
(FLAGS_api == "async" && iteration % nireq != 0)) {
inferRequest = inferRequestsQueue.getIdleRequest();
if (!inferRequest) {
IE_THROW() << "No idle Infer Requests!";
}
if (FLAGS_api == "sync") {
inferRequest->infer();
} else {
// As the inference request is currently idle, the wait() adds no
// additional overhead (and should return immediately). The primary
// reason for calling the method is exception checking/re-throwing.
// The callback that governs the actual execution can handle errors as
// well, but since it works with plain error codes it lacks the details
// that the what() method of `std::exception` provides, so we re-check
// for exceptions here.
inferRequest->wait();
inferRequest->startAsync();
}
iteration++;
execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();
if (niter > 0) {
progressBar.addProgress(1);
} else {
// Calculate how many progress intervals are covered by the current
// iteration; this depends on the current iteration time and the length
// of each progress interval. Previously covered progress intervals must
// be skipped.
auto progressIntervalTime = duration_nanoseconds / progressBarTotalCount;
size_t newProgress = execTime / progressIntervalTime - progressCnt;
progressBar.addProgress(newProgress);
progressCnt += newProgress;
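// e.g. a 60 s time limit split into 1000 progress intervals makes each
// interval 60 ms of wall-clock time.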
}
}
// wait for the last inference executions to complete
inferRequestsQueue.waitAll();
double latency = getMedianValue<double>(inferRequestsQueue.getLatencies(), FLAGS_latency_percentile);
double totalDuration = inferRequestsQueue.getDurationInMilliseconds();
double fps =
(FLAGS_api == "sync") ? batchSize * 1000.0 / latency : batchSize * 1000.0 * iteration / totalDuration;
if (statistics) {
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{
{"total execution time (ms)", double_to_string(totalDuration)},
{"total number of iterations", std::to_string(iteration)},
});
if (device_name.find("MULTI") == std::string::npos) {
std::string latency_label;
if (FLAGS_latency_percentile == 50) {
latency_label = "latency (ms)";
} else {
latency_label = "latency (" + std::to_string(FLAGS_latency_percentile) + " percentile) (ms)";
}
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{
{latency_label, double_to_string(latency)},
});
}
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{{"throughput", double_to_string(fps)}});
}
progressBar.finish();
// ----------------- 11. Dumping statistics report
// -------------------------------------------------------------
next_step();
#ifdef USE_OPENCV
if (!FLAGS_dump_config.empty()) {
dump_config(FLAGS_dump_config, config);
slog::info << "Inference Engine configuration settings were dumped to " << FLAGS_dump_config << slog::endl;
}
#endif
if (!FLAGS_exec_graph_path.empty()) {
try {
CNNNetwork execGraphInfo = exeNetwork.GetExecGraphInfo();
execGraphInfo.serialize(FLAGS_exec_graph_path);
slog::info << "executable graph is stored to " << FLAGS_exec_graph_path << slog::endl;
} catch (const std::exception& ex) {
slog::err << "Can't get executable graph: " << ex.what() << slog::endl;
}
}
if (perf_counts) {
std::vector<std::map<std::string, InferenceEngine::InferenceEngineProfileInfo>> perfCounts;
for (size_t ireq = 0; ireq < nireq; ireq++) {
auto reqPerfCounts = inferRequestsQueue.requests[ireq]->getPerformanceCounts();
if (FLAGS_pc) {
slog::info << "Performance counts for " << ireq << "-th infer request:" << slog::endl;
printPerformanceCounts(reqPerfCounts, std::cout, getFullDeviceName(ie, FLAGS_d), false);
}
perfCounts.push_back(reqPerfCounts);
}
if (statistics) {
statistics->dumpPerformanceCounters(perfCounts);
}
}
if (statistics)
statistics->dump();
std::cout << "Count: " << iteration << " iterations" << std::endl;
std::cout << "Duration: " << double_to_string(totalDuration) << " ms" << std::endl;
if (device_name.find("MULTI") == std::string::npos) {
std::cout << "Latency";
if (FLAGS_latency_percentile == 50) {
std::cout << ": ";
} else {
std::cout << " (" << FLAGS_latency_percentile << " percentile): ";
}
std::cout << double_to_string(latency) << " ms" << std::endl;
}
std::cout << "Throughput: " << double_to_string(fps) << " FPS" << std::endl;
} catch (const std::exception& ex) {
slog::err << ex.what() << slog::endl;
if (statistics) {
statistics->addParameters(StatisticsReport::Category::EXECUTION_RESULTS,
{
{"error", ex.what()},
});
statistics->dump();
}
return 3;
}
return 0;
}