openvino/samples/cpp/benchmark_app/main.cpp

// Copyright (C) 2018-2022 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

#include <algorithm>
#include <chrono>
#include <map>
#include <memory>
#include <string>
#include <utility>
#include <vector>

// clang-format off
#include "openvino/openvino.hpp"
#include "openvino/pass/serialize.hpp"

#include "gna/gna_config.hpp"
#include "gpu/gpu_config.hpp"

#include "samples/args_helper.hpp"
#include "samples/common.hpp"
#include "samples/slog.hpp"

#include "benchmark_app.hpp"
#include "infer_request_wrap.hpp"
#include "inputs_filling.hpp"
#include "progress_bar.hpp"
#include "remote_tensors_filling.hpp"
#include "statistics_report.hpp"
#include "utils.hpp"
// clang-format on

// Default total count for the progress bar, going by the name; the code that
// consumes it is outside this excerpt - TODO confirm exact usage.
static const size_t progressBarDefaultTotalCount = 1000;

/**
 * @brief Parses the command line with gflags and validates the benchmark options.
 *
 * Checks are performed in a fixed order: help request, presence of the model,
 * latency percentile range, API mode, performance hint value, compatibility of
 * fine-tune options with the hint, report type, and precision options versus a
 * pre-compiled (".blob") model.
 *
 * @param argc Argument count as received by main().
 * @param argv Argument vector as received by main().
 * @return false when help was requested (usage and available devices are printed),
 *         true when every check passed.
 * @throws std::logic_error when the model is not set or an option has an invalid
 *         value or is used in an unsupported combination.
 */
bool parse_and_check_command_line(int argc, char* argv[]) {
    // ---------------------------Parsing and validating input
    // arguments--------------------------------------
    slog::info << "Parsing input parameters" << slog::endl;
    gflags::ParseCommandLineNonHelpFlags(&argc, &argv, true);
    if (FLAGS_help || FLAGS_h) {
        show_usage();
        showAvailableDevices();
        return false;
    }

    if (FLAGS_m.empty()) {
        show_usage();
        throw std::logic_error("Model is required but not set. Please set -m option.");
    }

    if (FLAGS_latency_percentile > 100 || FLAGS_latency_percentile < 1) {
        show_usage();
        throw std::logic_error("The percentile value is incorrect. The applicable values range is [1, 100].");
    }

    if (FLAGS_api != "async" && FLAGS_api != "sync") {
        throw std::logic_error("Incorrect API. Please set -api option to `sync` or `async` value.");
    }

    // An empty -hint is allowed here; a default is picked later based on -api.
    const bool isKnownHint = FLAGS_hint == "throughput" || FLAGS_hint == "tput" || FLAGS_hint == "latency" ||
                             FLAGS_hint == "cumulative_throughput" || FLAGS_hint == "ctput" || FLAGS_hint == "none";
    if (!FLAGS_hint.empty() && !isKnownHint) {
        // The adjacent literals are concatenated by the compiler, so the first one must end with a space.
        throw std::logic_error("Incorrect performance hint. Please set -hint option to "
                               "`throughput`(tput), `latency`, 'cumulative_throughput'(ctput) value or 'none'.");
    }

    // Fine-tune options are only accepted when the hint is explicitly disabled with "-hint none".
    const bool isFineTuneRequested = !FLAGS_nstreams.empty() || FLAGS_nthreads != 0 || !FLAGS_pin.empty();
    if (FLAGS_hint != "none" && isFineTuneRequested) {
        throw std::logic_error("-nstreams, -nthreads and -pin options are fine tune options. To use them you "
                               "should explicitly set -hint option to none. This is not OpenVINO limitation "
                               "(those options can be used in OpenVINO together), but a benchmark_app UI rule.");
    }

    if (!FLAGS_report_type.empty() && FLAGS_report_type != noCntReport && FLAGS_report_type != averageCntReport &&
        FLAGS_report_type != detailedCntReport) {
        const std::string err = "only " + std::string(noCntReport) + "/" + std::string(averageCntReport) + "/" +
                                std::string(detailedCntReport) +
                                " report types are supported (invalid -report_type option value)";
        throw std::logic_error(err);
    }

    if (FLAGS_report_type == averageCntReport && FLAGS_d.find("MULTI") != std::string::npos) {
        throw std::logic_error("only " + std::string(detailedCntReport) + " report type is supported for MULTI device");
    }

    // A model file with the "blob" extension is treated as already compiled; its precisions cannot be changed.
    const bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
    const bool isPrecisionSet = !(FLAGS_ip.empty() && FLAGS_op.empty() && FLAGS_iop.empty());
    if (isNetworkCompiled && isPrecisionSet) {
        throw std::logic_error("Cannot set precision for a compiled network. "
                               "Please re-compile your network with required precision "
                               "using compile_tool");
    }
    return true;
}

/**
 * @brief Advances the step counter and prints the "[Step i/N] <title>" banner to stdout.
 *
 * The counter is a function-local static, so every call announces the step that
 * follows the previously announced one. An assertion fails when the counter
 * moves past the last known step.
 *
 * @param additional_info Optional note printed in parentheses after the step title;
 *                        nothing is appended when it is empty.
 */
static void next_step(const std::string additional_info = "") {
    // Titles of the benchmark stages keyed by their 1-based ordinal.
    static const std::map<size_t, std::string> step_names = {
        {1, "Parsing and validating input arguments"},
        {2, "Loading OpenVINO Runtime"},
        {3, "Setting device configuration"},
        {4, "Reading network files"},
        {5, "Resizing network to match image sizes and given batch"},
        {6, "Configuring input of the model"},
        {7, "Loading the model to the device"},
        {8, "Setting optimal runtime parameters"},
        {9, "Creating infer requests and preparing input blobs with data"},
        {10, "Measuring performance"},
        {11, "Dumping statistics report"}};
    // Ordinal of the most recently announced step; kept between calls.
    static size_t step_id = 0;

    ++step_id;

    OPENVINO_ASSERT(step_names.count(step_id) != 0,
                    "Step ID ",
                    step_id,
                    " is out of total steps number ",
                    step_names.size());

    const std::string& title = step_names.at(step_id);

    std::string suffix;
    if (!additional_info.empty()) {
        suffix = " (" + additional_info + ")";
    }

    std::cout << "[Step " << step_id << "/" << step_names.size() << "] " << title << suffix << std::endl;
}

/**
 * @brief Selects the performance hint for a device from the -hint and -api flags.
 *
 * If the device does not list ov::hint::performance_mode among its supported
 * properties, no hint is selected (a warning is logged when -hint was given).
 * If -hint is empty, LATENCY is chosen for the "sync" API and THROUGHPUT otherwise.
 * Otherwise the -hint value is mapped to the matching mode; "none" and any
 * unrecognized value yield UNDEFINED.
 *
 * @param device Name of the device whose supported properties are queried.
 * @param core   OpenVINO core used to read the device properties.
 * @return The selected mode, or ov::hint::PerformanceMode::UNDEFINED when no hint applies.
 */
ov::hint::PerformanceMode get_performance_hint(const std::string& device, const ov::Core& core) {
    auto supported_properties = core.get_property(device, ov::supported_properties);
    const bool hint_is_supported =
        std::find(supported_properties.begin(), supported_properties.end(), ov::hint::performance_mode) !=
        supported_properties.end();
    const bool hint_is_given = !FLAGS_hint.empty();

    // The device cannot take a hint at all: only tell the user if one was requested.
    if (!hint_is_supported) {
        if (hint_is_given) {
            slog::warn << "Device(" << device << ") does not support performance hint property(-hint)." << slog::endl;
        }
        return ov::hint::PerformanceMode::UNDEFINED;
    }

    // No explicit request: derive the hint from the selected API mode.
    if (!hint_is_given) {
        const ov::hint::PerformanceMode default_hint =
            FLAGS_api == "sync" ? ov::hint::PerformanceMode::LATENCY : ov::hint::PerformanceMode::THROUGHPUT;

        slog::warn << "Performance hint was not explicitly specified in command line. "
                      "Device("
                   << device << ") performance hint will be set to " << default_hint << "." << slog::endl;
        return default_hint;
    }

    if (FLAGS_hint == "throughput" || FLAGS_hint == "tput") {
        slog::warn << "Device(" << device << ") performance hint is set to THROUGHPUT" << slog::endl;
        return ov::hint::PerformanceMode::THROUGHPUT;
    }
    if (FLAGS_hint == "latency") {
        slog::warn << "Device(" << device << ") performance hint is set to LATENCY" << slog::endl;
        return ov::hint::PerformanceMode::LATENCY;
    }
    if (FLAGS_hint == "cumulative_throughput" || FLAGS_hint == "ctput") {
        slog::warn << "Device(" << device << ") performance hint is set to CUMULATIVE_THROUGHPUT" << slog::endl;
        return ov::hint::PerformanceMode::CUMULATIVE_THROUGHPUT;
    }
    if (FLAGS_hint == "none") {
        slog::warn << "No device(" << device << ") performance hint is set" << slog::endl;
    }
    // "none" and any value not matched above leave the hint undefined.
    return ov::hint::PerformanceMode::UNDEFINED;
}

/**
 * @brief The entry point of the benchmark application
 */
int main(int argc, char* argv[]) {
    std::shared_ptr<StatisticsReport> statistics;
    try {
        ov::CompiledModel compiledModel;

        // ----------------- 1. Parsing and validating input arguments
        // -------------------------------------------------
        next_step();

        if (!parse_and_check_command_line(argc, argv)) {
            return 0;
        }

        bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
        if (isNetworkCompiled) {
            slog::info << "Network is compiled" << slog::endl;
        }

        std::vector<gflags::CommandLineFlagInfo> flags;
        StatisticsReport::Parameters command_line_arguments;
        gflags::GetAllFlags(&flags);
        for (auto& flag : flags) {
            if (!flag.is_default) {
                command_line_arguments.emplace_back(flag.name, flag.name, flag.current_value);
            }
        }
        if (!FLAGS_report_type.empty()) {
            statistics = FLAGS_json_stats ? std::make_shared<StatisticsReportJSON>(
                                                StatisticsReport::Config{FLAGS_report_type, FLAGS_report_folder})
                                          : std::make_shared<StatisticsReport>(
                                                StatisticsReport::Config{FLAGS_report_type, FLAGS_report_folder});

            statistics->add_parameters(StatisticsReport::Category::COMMAND_LINE_PARAMETERS, command_line_arguments);
        }
        auto isFlagSetInCommandLine = [&command_line_arguments](const std::string& name) {
            return (std::find_if(command_line_arguments.begin(),
                                 command_line_arguments.end(),
                                 [name](const StatisticsVariant& p) {
                                     return p.json_name == name;
                                 }) != command_line_arguments.end());
        };

        std::string device_name = FLAGS_d;

        // Parse devices
        auto devices = parse_devices(device_name);

        // Parse nstreams per device
        std::map<std::string, std::string> device_nstreams = parse_value_per_device(devices, FLAGS_nstreams);
        std::map<std::string, std::string> device_infer_precision =
            parse_value_per_device(devices, FLAGS_infer_precision);

        // Load device config file if specified
        std::map<std::string, ov::AnyMap> config;
        if (!FLAGS_load_config.empty()) {
            load_config(FLAGS_load_config, config);
        }

        /** This vector stores paths to the processed images with input names**/
        auto inputFiles = parse_input_arguments(gflags::GetArgvs());

        // ----------------- 2. Loading the OpenVINO Runtime
        // -----------------------------------------------------------
        next_step();

        ov::Core core;

        if (!FLAGS_extensions.empty()) {
            // Extensions are loaded as a shared library
            core.add_extension(FLAGS_extensions);
            slog::info << "Extensions are loaded: " << FLAGS_extensions << slog::endl;
        }

        // Load clDNN Extensions
        if ((FLAGS_d.find("GPU") != std::string::npos) && !FLAGS_c.empty()) {
            // Override config if command line parameter is specified
            if (!config.count("GPU"))
                config["GPU"] = {};
            config["GPU"][CONFIG_KEY(CONFIG_FILE)] = FLAGS_c;
        }
        if (config.count("GPU") && config.at("GPU").count(CONFIG_KEY(CONFIG_FILE))) {
            auto ext = config.at("GPU").at(CONFIG_KEY(CONFIG_FILE)).as<std::string>();
            core.set_property("GPU", {{CONFIG_KEY(CONFIG_FILE), ext}});
            slog::info << "GPU extensions are loaded: " << ext << slog::endl;
        }

        slog::info << "OpenVINO: " << ov::get_openvino_version() << slog::endl;
        slog::info << "Device info: " << slog::endl;
        slog::info << core.get_versions(device_name) << slog::endl;

        // ----------------- 3. Setting device configuration
        // -----------------------------------------------------------
        next_step();

        auto getDeviceTypeFromName = [](std::string device) -> std::string {
            return device.substr(0, device.find_first_of(".("));
        };

        // Set default values from dumped config
        std::set<std::string> default_devices;
        for (auto& device : devices) {
            auto default_config = config.find(getDeviceTypeFromName(device));
            if (default_config != config.end()) {
                if (!config.count(device)) {
                    config[device] = default_config->second;
                    default_devices.emplace(default_config->first);
                }
            }
        }
        for (auto& device : default_devices) {
            config.erase(device);
        }

        bool perf_counts = false;
        // check if using the virtual device
        auto if_auto = std::find(devices.begin(), devices.end(), "AUTO") != devices.end();
        auto if_multi = std::find(devices.begin(), devices.end(), "MULTI") != devices.end();
        // Remove the hardware devices if AUTO/MULTI appears in the devices list.
        if (if_auto || if_multi) {
            devices.clear();
            std::string virtual_device;
            if (if_auto) {
                virtual_device = "AUTO";
                devices.push_back("AUTO");
            }
            if (if_multi) {
                virtual_device = "MULTI";
                devices.push_back("MULTI");
            }
            parse_value_for_virtual_device(virtual_device, device_nstreams);
            parse_value_for_virtual_device(virtual_device, device_infer_precision);
        }
        // Update config per device according to command line parameters
        for (auto& device : devices) {
            auto& device_config = config[device];

            // high-level performance modes
            auto ov_perf_hint = get_performance_hint(device, core);
            if (ov_perf_hint != ov::hint::PerformanceMode::UNDEFINED) {
                device_config.emplace(ov::hint::performance_mode(ov_perf_hint));
                if (FLAGS_nireq != 0)
                    device_config.emplace(ov::hint::num_requests(FLAGS_nireq));
            }

            // Set performance counter
            if (isFlagSetInCommandLine("pc")) {
                // set to user defined value
                device_config.emplace(ov::enable_profiling(FLAGS_pc));
            } else if (device_config.count(ov::enable_profiling.name()) &&
                       (device_config.at(ov::enable_profiling.name()).as<bool>())) {
                slog::warn << "Performance counters for " << device
                           << " device is turned on. To print results use -pc option." << slog::endl;
            } else if (FLAGS_report_type == detailedCntReport || FLAGS_report_type == averageCntReport) {
                slog::warn << "Turn on performance counters for " << device << " device since report type is "
                           << FLAGS_report_type << "." << slog::endl;
                device_config.emplace(ov::enable_profiling(true));
            } else if (!FLAGS_exec_graph_path.empty()) {
                slog::warn << "Turn on performance counters for " << device << " device due to execution graph dumping."
                           << slog::endl;
                device_config.emplace(ov::enable_profiling(true));
            } else {
                // set to default value
                device_config.emplace(ov::enable_profiling(FLAGS_pc));
            }
            perf_counts = (device_config.at(ov::enable_profiling.name()).as<bool>()) ? true : perf_counts;

            auto supported_properties = core.get_property(device, ov::supported_properties);

            auto supported = [&](const std::string& key) {
                return std::find(std::begin(supported_properties), std::end(supported_properties), key) !=
                       std::end(supported_properties);
            };
            // the rest are individual per-device settings (overriding the values set with perf modes)
            auto setThroughputStreams = [&]() {
                std::string key = getDeviceTypeFromName(device) + "_THROUGHPUT_STREAMS";
                auto it_device_nstreams = device_nstreams.find(device);
                if (it_device_nstreams != device_nstreams.end()) {
                    // set to user defined value
                    if (supported(key)) {
                        device_config[key] = it_device_nstreams->second;
                    } else if (supported(ov::num_streams.name())) {
                        // Use API 2.0 key for streams
                        key = ov::num_streams.name();
                        device_config[key] = it_device_nstreams->second;
                    } else if (device == "MULTI" || device == "AUTO") {
                        // check if the element contains the hardware device property
                        auto value_vec = split(it_device_nstreams->second, ' ');
                        if (value_vec.size() == 1) {
                            key = ov::num_streams.name();
                            device_config[key] = it_device_nstreams->second;
                        } else {
                            // set device nstreams properties in the AUTO/MULTI plugin
                            std::stringstream strm(it_device_nstreams->second);
                            std::map<std::string, std::string> devices_property;
                            ov::util::Read<std::map<std::string, std::string>>{}(strm, devices_property);
                            for (auto it : devices_property) {
                                device_config.insert(
                                    ov::device::properties(it.first, ov::num_streams(std::stoi(it.second))));
                            }
                        }
                    } else {
                        throw std::logic_error("Device " + device + " doesn't support config key '" + key + "' " +
                                               "and '" + ov::num_streams.name() + "'!" +
                                               "Please specify -nstreams for correct devices in format  "
                                               "<dev1>:<nstreams1>,<dev2>:<nstreams2>" +
                                               " or via configuration file.");
                    }
                } else if (ov_perf_hint == ov::hint::PerformanceMode::UNDEFINED && !device_config.count(key) &&
                           (FLAGS_api == "async")) {
                    slog::warn << "-nstreams default value is determined automatically for " << device
                               << " device. "
                                  "Although the automatic selection usually provides a "
                                  "reasonable performance, "
                                  "but it still may be non-optimal for some cases, for more "
                                  "information look at README."
                               << slog::endl;
                    if (std::string::npos == device.find("MYRIAD")) {  // MYRIAD sets the default number of
                                                                       // streams implicitly (without _AUTO)
                        if (supported(key)) {
                            device_config[key] = std::string(getDeviceTypeFromName(device) + "_THROUGHPUT_AUTO");
                        } else if (supported(ov::num_streams.name())) {
                            // Use API 2.0 key for streams
                            key = ov::num_streams.name();
                            device_config[key] = ov::streams::AUTO;
                        }
                    }
                }
                auto it_streams = device_config.find(ov::num_streams.name());
                if (it_streams != device_config.end())
                    device_nstreams[device] = it_streams->second.as<std::string>();
            };

            auto set_infer_precision = [&] {
                auto it_device_infer_precision = device_infer_precision.find(device);
                if (it_device_infer_precision != device_infer_precision.end()) {
                    // set to user defined value
                    if (!supported(ov::hint::inference_precision.name())) {
                        throw std::logic_error("Device " + device + " doesn't support config key '" +
                                               ov::hint::inference_precision.name() + "'! " +
                                               "Please specify -infer_precision for correct devices in format  "
                                               "<dev1>:<infer_precision1>,<dev2>:<infer_precision2>" +
                                               " or via configuration file.");
                    }
                    device_config.emplace(ov::hint::inference_precision(it_device_infer_precision->second));
                }
            };

            auto fix_pin_option = [](const std::string& str) -> std::string {
                if (str == "NO")
                    return "NONE";
                else if (str == "YES")
                    return "CORE";
                else
                    return str;
            };

            if (supported(ov::inference_num_threads.name()) && isFlagSetInCommandLine("nthreads")) {
                device_config.emplace(ov::inference_num_threads(FLAGS_nthreads));
            }
            if (supported(ov::affinity.name()) && isFlagSetInCommandLine("pin")) {
                device_config.emplace(ov::affinity(fix_pin_option(FLAGS_pin)));
            }

            if (device.find("CPU") != std::string::npos || device.find("GPU") != std::string::npos) {
                // CPU supports few special performance-oriented keys
                // for CPU and GPU execution, more throughput-oriented execution via streams
                setThroughputStreams();
                set_infer_precision();
            } else if (device.find("MYRIAD") != std::string::npos) {
                device_config.emplace(ov::log::level(ov::log::Level::WARNING));
                setThroughputStreams();
            } else if (device.find("GNA") != std::string::npos) {
                set_infer_precision();
            } else if (device.find("AUTO") != std::string::npos) {
                setThroughputStreams();
                set_infer_precision();
                device_nstreams.erase(device);
            } else if (device.find("MULTI") != std::string::npos) {
                setThroughputStreams();
                set_infer_precision();
                if ((device_name.find("GPU") != std::string::npos) && (device_name.find("CPU") != std::string::npos)) {
                    slog::warn << "GPU throttling is turned on. Multi-device execution with "
                                  "the CPU + GPU performs best with GPU throttling hint, "
                               << "which releases another CPU thread (that is otherwise "
                                  "used by the GPU driver for active polling)."
                               << slog::endl;

                    device_config.insert(ov::device::properties("GPU", {{GPU_CONFIG_KEY(PLUGIN_THROTTLE), 1}}));
                    // limit threading for CPU portion of inference
                    if (!isFlagSetInCommandLine("pin")) {
                        auto it_affinity = device_config.find(ov::affinity.name());
                        if (it_affinity != device_config.end()) {
                            slog::warn << "Turn off threads pinning for " << device
                                       << " device since multi-scenario with GPU device is used." << slog::endl;
                            it_affinity->second = ov::Affinity::NONE;
                        }
                    }
                }
                device_nstreams.erase(device);
            }
        }

        for (auto&& item : config) {
            core.set_property(item.first, item.second);
        }

        size_t batchSize = FLAGS_b;
        ov::element::Type type = ov::element::undefined;
        std::string topology_name = "";
        std::vector<benchmark_app::InputsInfo> app_inputs_info;
        std::string output_name;

        // Takes priority over config from file
        if (!FLAGS_cache_dir.empty()) {
            core.set_property(ov::cache_dir(FLAGS_cache_dir));
        }

        // If set batch size, disable the auto batching
        if (FLAGS_b > 0) {
            core.set_property(ov::hint::allow_auto_batching(false));
        }

        bool isDynamicNetwork = false;

        if (FLAGS_load_from_file && !isNetworkCompiled) {
            next_step();
            slog::info << "Skipping the step for loading network from file" << slog::endl;
            next_step();
            slog::info << "Skipping the step for loading network from file" << slog::endl;
            next_step();
            slog::info << "Skipping the step for loading network from file" << slog::endl;
            auto startTime = Time::now();
            compiledModel = core.compile_model(FLAGS_m, device_name);
            auto duration_ms = get_duration_ms_till_now(startTime);
            slog::info << "Load network took " << double_to_string(duration_ms) << " ms" << slog::endl;
            slog::info << "Original network I/O parameters:" << slog::endl;
            printInputAndOutputsInfoShort(compiledModel);

            if (statistics)
                statistics->add_parameters(
                    StatisticsReport::Category::EXECUTION_RESULTS,
                    {StatisticsVariant("load network time (ms)", "load_network_time", duration_ms)});

            convert_io_names_in_map(inputFiles, compiledModel.inputs());
            app_inputs_info = get_inputs_info(FLAGS_shape,
                                              FLAGS_layout,
                                              batchSize,
                                              FLAGS_data_shape,
                                              inputFiles,
                                              FLAGS_iscale,
                                              FLAGS_imean,
                                              compiledModel.inputs());
            if (batchSize == 0) {
                batchSize = 1;
            }

        } else if (!isNetworkCompiled) {
            // ----------------- 4. Reading the Intermediate Representation network
            // ----------------------------------------
            next_step();

            slog::info << "Loading network files" << slog::endl;

            auto startTime = Time::now();
            auto model = core.read_model(FLAGS_m);
            auto duration_ms = get_duration_ms_till_now(startTime);
            slog::info << "Read network took " << double_to_string(duration_ms) << " ms" << slog::endl;
            slog::info << "Original network I/O parameters:" << slog::endl;
            printInputAndOutputsInfoShort(*model);

            if (statistics)
                statistics->add_parameters(
                    StatisticsReport::Category::EXECUTION_RESULTS,
                    {StatisticsVariant("read network time (ms)", "read_network_time", duration_ms)});

            const auto& inputInfo = std::const_pointer_cast<const ov::Model>(model)->inputs();
            if (inputInfo.empty()) {
                throw std::logic_error("no inputs info is provided");
            }

            // ----------------- 5. Resizing network to match image sizes and given
            // batch ----------------------------------
            for (auto& item : model->inputs()) {
                if (item.get_tensor().get_names().empty()) {
                    item.get_tensor_ptr()->set_names(
                        std::unordered_set<std::string>{item.get_node_shared_ptr()->get_name()});
                }
            }
            next_step();
            convert_io_names_in_map(inputFiles, std::const_pointer_cast<const ov::Model>(model)->inputs());
            // Parse input shapes if specified
            bool reshape = false;
            app_inputs_info = get_inputs_info(FLAGS_shape,
                                              FLAGS_layout,
                                              FLAGS_b,
                                              FLAGS_data_shape,
                                              inputFiles,
                                              FLAGS_iscale,
                                              FLAGS_imean,
                                              inputInfo,
                                              reshape);
            if (reshape) {
                benchmark_app::PartialShapes shapes = {};
                for (auto& item : app_inputs_info[0])
                    shapes[item.first] = item.second.partialShape;
                slog::info << "Reshaping network: " << get_shapes_string(shapes) << slog::endl;
                startTime = Time::now();
                model->reshape(shapes);
                duration_ms = get_duration_ms_till_now(startTime);
                slog::info << "Reshape network took " << double_to_string(duration_ms) << " ms" << slog::endl;
                if (statistics)
                    statistics->add_parameters(
                        StatisticsReport::Category::EXECUTION_RESULTS,
                        {StatisticsVariant("reshape network time (ms)", "reshape_network_time", duration_ms)});
            }

            // ----------------- 6. Configuring inputs and outputs
            // ----------------------------------------------------------------------
            next_step();
            auto preproc = ov::preprocess::PrePostProcessor(model);

            std::map<std::string, std::string> user_precisions_map;
            if (!FLAGS_iop.empty()) {
                user_precisions_map = parseArgMap(FLAGS_iop);
                convert_io_names_in_map(user_precisions_map,
                                        std::const_pointer_cast<const ov::Model>(model)->inputs(),
                                        std::const_pointer_cast<const ov::Model>(model)->outputs());
            }

            const auto input_precision = FLAGS_ip.empty() ? ov::element::undefined : getPrecision2(FLAGS_ip);
            const auto output_precision = FLAGS_op.empty() ? ov::element::undefined : getPrecision2(FLAGS_op);

            const auto& inputs = model->inputs();
            for (int i = 0; i < inputs.size(); i++) {
                const auto& item = inputs[i];
                auto iop_precision = ov::element::undefined;
                auto type_to_set = ov::element::undefined;
                std::string name;
                try {
                    // Some tensors might have no names, get_any_name will throw exception in that case.
                    // -iop option will not work for those tensors.
                    name = item.get_any_name();
                    iop_precision = getPrecision2(user_precisions_map.at(item.get_any_name()));
                } catch (...) {
                }

                if (iop_precision != ov::element::undefined) {
                    type_to_set = iop_precision;
                } else if (input_precision != ov::element::undefined) {
                    type_to_set = input_precision;
                } else if (!name.empty() && app_inputs_info[0].at(name).is_image()) {
                    // image input, set U8
                    type_to_set = ov::element::u8;
                }

                auto& in = preproc.input(item.get_any_name());
                if (type_to_set != ov::element::undefined) {
                    in.tensor().set_element_type(type_to_set);

                    if (!name.empty()) {
                        for (auto& info : app_inputs_info) {
                            info.at(name).type = type_to_set;
                        }
                    }
                }
                // Explicitly set inputs layout.
                if (!name.empty() && !app_inputs_info[0].at(name).layout.empty()) {
                    in.model().set_layout(app_inputs_info[0].at(name).layout);
                }
            }

            const auto& outs = model->outputs();
            for (int i = 0; i < outs.size(); i++) {
                const auto& item = outs[i];
                auto iop_precision = ov::element::undefined;
                try {
                    // Some tensors might have no names, get_any_name will throw exception in that case.
                    // -iop option will not work for those tensors.
                    iop_precision = getPrecision2(user_precisions_map.at(item.get_any_name()));
                } catch (...) {
                }

                if (iop_precision != ov::element::undefined) {
                    preproc.output(i).tensor().set_element_type(iop_precision);
                } else if (output_precision != ov::element::undefined) {
                    preproc.output(i).tensor().set_element_type(output_precision);
                }
            }

            model = preproc.build();

            // Check if network has dynamic shapes
            auto input_info = app_inputs_info[0];
            isDynamicNetwork = std::any_of(input_info.begin(),
                                           input_info.end(),
                                           [](const std::pair<std::string, benchmark_app::InputInfo>& i) {
                                               return i.second.partialShape.is_dynamic();
                                           });

            topology_name = model->get_friendly_name();

            // Calculate batch size according to provided layout and shapes (static case)
            if (!isDynamicNetwork && app_inputs_info.size()) {
                batchSize = get_batch_size(app_inputs_info.front());

                slog::info << "Network batch size: " << batchSize << slog::endl;
            } else if (batchSize == 0) {
                batchSize = 1;
            }

            printInputAndOutputsInfoShort(*model);
            // ----------------- 7. Loading the model to the device
            // --------------------------------------------------------
            next_step();
            startTime = Time::now();
            compiledModel = core.compile_model(model, device_name);
            duration_ms = get_duration_ms_till_now(startTime);
            slog::info << "Load network took " << double_to_string(duration_ms) << " ms" << slog::endl;
            if (statistics)
                statistics->add_parameters(
                    StatisticsReport::Category::EXECUTION_RESULTS,
                    {StatisticsVariant("load network time (ms)", "load_network_time", duration_ms)});
        } else {
            next_step();
            slog::info << "Skipping the step for compiled network" << slog::endl;
            next_step();
            slog::info << "Skipping the step for compiled network" << slog::endl;
            next_step();
            slog::info << "Skipping the step for compiled network" << slog::endl;
            // ----------------- 7. Loading the model to the device
            // --------------------------------------------------------
            next_step();
            auto startTime = Time::now();

            std::ifstream modelStream(FLAGS_m, std::ios_base::binary | std::ios_base::in);
            if (!modelStream.is_open()) {
                throw std::runtime_error("Cannot open model file " + FLAGS_m);
            }
            compiledModel = core.import_model(modelStream, device_name, {});
            modelStream.close();

            auto duration_ms = get_duration_ms_till_now(startTime);
            slog::info << "Import network took " << double_to_string(duration_ms) << " ms" << slog::endl;
            slog::info << "Original network I/O paramteters:" << slog::endl;
            printInputAndOutputsInfoShort(compiledModel);

            if (statistics)
                statistics->add_parameters(
                    StatisticsReport::Category::EXECUTION_RESULTS,
                    {StatisticsVariant("import network time (ms)", "import_network_time", duration_ms)});

            convert_io_names_in_map(inputFiles, compiledModel.inputs());
            app_inputs_info = get_inputs_info(FLAGS_shape,
                                              FLAGS_layout,
                                              FLAGS_b,
                                              FLAGS_data_shape,
                                              inputFiles,
                                              FLAGS_iscale,
                                              FLAGS_imean,
                                              compiledModel.inputs());
            if (batchSize == 0) {
                batchSize = 1;
            }
        }

        if (isDynamicNetwork && FLAGS_api == "sync") {
            throw std::logic_error("Benchmarking of the model with dynamic shapes is available for async API only."
                                   "Please use -api async -nstreams 1 -nireq 1 to emulate sync behavior");
        }

        // Defining of benchmark mode
        // for static models inference only mode is used as default one
        bool inferenceOnly = FLAGS_inference_only;
        if (isDynamicNetwork) {
            if (isFlagSetInCommandLine("inference_only") && inferenceOnly && app_inputs_info.size() != 1) {
                throw std::logic_error(
                    "Dynamic models with different input data shapes must be benchmarked only in full mode.");
            }
            inferenceOnly = isFlagSetInCommandLine("inference_only") && inferenceOnly && app_inputs_info.size() == 1;
        }

        // ----------------- 8. Querying optimal runtime parameters
        // -----------------------------------------------------
        next_step();
        // output of the actual settings that the device selected
        for (const auto& device : devices) {
            auto supported_properties = compiledModel.get_property(ov::supported_properties);
            slog::info << "Device: " << device << slog::endl;
            for (const auto& cfg : supported_properties) {
                try {
                    if (cfg == ov::supported_properties)
                        continue;

                    auto prop = compiledModel.get_property(cfg);
                    slog::info << "  { " << cfg << " , " << prop.as<std::string>() << " }" << slog::endl;
                } catch (const ov::Exception&) {
                }
            }
        }

        // Update number of streams
        for (auto&& ds : device_nstreams) {
            try {
                const std::string key = getDeviceTypeFromName(ds.first) + "_THROUGHPUT_STREAMS";
                device_nstreams[ds.first] = core.get_property(ds.first, key).as<std::string>();
            } catch (const ov::Exception&) {
                device_nstreams[ds.first] = core.get_property(ds.first, ov::num_streams.name()).as<std::string>();
            }
        }

        // Number of requests
        uint32_t nireq = FLAGS_nireq;
        if (nireq == 0) {
            if (FLAGS_api == "sync") {
                nireq = 1;
            } else {
                try {
                    nireq = compiledModel.get_property(ov::optimal_number_of_infer_requests);
                } catch (const std::exception& ex) {
                    throw ov::Exception("Every device used with the benchmark_app should support " +
                                        std::string(ov::optimal_number_of_infer_requests.name()) +
                                        " Failed to query the metric for the " + device_name +
                                        " with error:" + ex.what());
                }
            }
        }

        // Iteration limit
        uint32_t niter = FLAGS_niter;
        size_t shape_groups_num = app_inputs_info.size();
        if ((niter > 0) && (FLAGS_api == "async")) {
            if (shape_groups_num > nireq) {
                niter = ((niter + shape_groups_num - 1) / shape_groups_num) * shape_groups_num;
                if (FLAGS_niter != niter) {
                    slog::warn << "Number of iterations was aligned by data shape groups number from " << FLAGS_niter
                               << " to " << niter << " using number of possible input shapes " << shape_groups_num
                               << slog::endl;
                }
            } else {
                niter = ((niter + nireq - 1) / nireq) * nireq;
                if (FLAGS_niter != niter) {
                    slog::warn << "Number of iterations was aligned by request number from " << FLAGS_niter << " to "
                               << niter << " using number of requests " << nireq << slog::endl;
                }
            }
        }

        // Time limit
        uint32_t duration_seconds = 0;
        if (FLAGS_t != 0) {
            // time limit
            duration_seconds = FLAGS_t;
        } else if (FLAGS_niter == 0) {
            // default time limit
            duration_seconds = device_default_device_duration_in_seconds(device_name);
        }
        uint64_t duration_nanoseconds = get_duration_in_nanoseconds(duration_seconds);

        if (statistics) {
            statistics->add_parameters(
                StatisticsReport::Category::RUNTIME_CONFIG,
                StatisticsReport::Parameters(
                    {StatisticsVariant("benchmark mode", "benchmark_mode", inferenceOnly ? "inference only" : "full"),
                     StatisticsVariant("topology", "topology", topology_name),
                     StatisticsVariant("target device", "target_device", device_name),
                     StatisticsVariant("API", "api", FLAGS_api),
                     StatisticsVariant("precision", "precision", type.get_type_name()),
                     StatisticsVariant("batch size", "batch_size", batchSize),
                     StatisticsVariant("number of iterations", "iterations_num", niter),
                     StatisticsVariant("number of parallel infer requests", "nireq", nireq),
                     StatisticsVariant("duration (ms)", "duration", get_duration_in_milliseconds(duration_seconds))}));
            for (auto& nstreams : device_nstreams) {
                std::stringstream ss;
                ss << "number of " << nstreams.first << " streams";

                std::string dev_name = nstreams.first;
                std::transform(dev_name.begin(), dev_name.end(), dev_name.begin(), [](unsigned char c) {
                    return c == ' ' ? '_' : std::tolower(c);
                });

                statistics->add_parameters(StatisticsReport::Category::RUNTIME_CONFIG,
                                           {StatisticsVariant(ss.str(), dev_name + "_streams_num", nstreams.second)});
            }
        }

        // ----------------- 9. Creating infer requests and filling input blobs
        // ----------------------------------------
        next_step();

        InferRequestsQueue inferRequestsQueue(compiledModel, nireq, app_inputs_info.size(), FLAGS_pcseq);

        bool inputHasName = false;
        if (inputFiles.size() > 0) {
            inputHasName = inputFiles.begin()->first != "";
        }
        bool newInputType = isDynamicNetwork || inputHasName;
        // create vector to store remote input blobs buffer
        std::vector<::gpu::BufferType> clInputsBuffer;
        bool useGpuMem = false;

        std::map<std::string, ov::TensorVector> inputsData;
        if (isFlagSetInCommandLine("use_device_mem")) {
            if (device_name.find("GPU") == 0) {
                inputsData = ::gpu::get_remote_input_tensors(inputFiles,
                                                             app_inputs_info,
                                                             compiledModel,
                                                             clInputsBuffer,
                                                             inferRequestsQueue.requests.size());
                useGpuMem = true;
            } else if (device_name.find("CPU") == 0) {
                if (newInputType) {
                    inputsData = get_tensors(inputFiles, app_inputs_info);
                } else {
                    inputsData = get_tensors_static_case(
                        inputFiles.empty() ? std::vector<std::string>{} : inputFiles.begin()->second,
                        batchSize,
                        app_inputs_info[0],
                        nireq);
                }
            } else {
                throw ov::Exception("Requested device doesn't support `use_device_mem` option.");
            }
        } else {
            if (newInputType) {
                inputsData = get_tensors(inputFiles, app_inputs_info);
            } else {
                inputsData = get_tensors_static_case(
                    inputFiles.empty() ? std::vector<std::string>{} : inputFiles.begin()->second,
                    batchSize,
                    app_inputs_info[0],
                    nireq);
            }
        }
        // ----------------- 10. Measuring performance
        // ------------------------------------------------------------------
        size_t progressCnt = 0;
        size_t progressBarTotalCount = progressBarDefaultTotalCount;
        size_t iteration = 0;

        std::stringstream ss;
        ss << "Start inference " << FLAGS_api << "hronously";
        if (FLAGS_api == "async") {
            if (!ss.str().empty()) {
                ss << ", ";
            }
            ss << nireq << " inference requests";
            std::stringstream device_ss;
            for (auto& nstreams : device_nstreams) {
                if (!device_ss.str().empty()) {
                    device_ss << ", ";
                }
                device_ss << nstreams.second << " streams for " << nstreams.first;
            }
            if (!device_ss.str().empty()) {
                ss << " using " << device_ss.str();
            }
        }
        ss << ", limits: ";
        if (duration_seconds > 0) {
            ss << get_duration_in_milliseconds(duration_seconds) << " ms duration";
        }
        if (niter != 0) {
            if (duration_seconds == 0) {
                progressBarTotalCount = niter;
            }
            if (duration_seconds > 0) {
                ss << ", ";
            }
            ss << niter << " iterations";
        }

        next_step(ss.str());

        if (inferenceOnly) {
            slog::info << "BENCHMARK IS IN INFERENCE ONLY MODE." << slog::endl;
            slog::info << "Input blobs will be filled once before performance measurements." << slog::endl;
        } else {
            slog::info << "BENCHMARK IS IN FULL MODE." << slog::endl;
            slog::info << "Inputs setup stage will be included in performance measurements." << slog::endl;
        }

        // copy prepared data straight into inferRequest->get_tensor()
        // for inference only mode
        if (inferenceOnly) {
            if (nireq < inputsData.begin()->second.size())
                slog::warn << "Only " << nireq << " test configs will be used." << slog::endl;
            size_t i = 0;
            for (auto& inferRequest : inferRequestsQueue.requests) {
                auto inputs = app_inputs_info[i % app_inputs_info.size()];
                for (auto& item : inputs) {
                    auto inputName = item.first;
                    const auto& inputTensor = inputsData.at(inputName)[i % inputsData.at(inputName).size()];
                    // for remote tensors set_tensor is used, as they are already allocated on the device
                    if (useGpuMem) {
                        inferRequest->set_tensor(inputName, inputTensor);
                    } else {
                        auto requestTensor = inferRequest->get_tensor(inputName);
                        if (isDynamicNetwork) {
                            requestTensor.set_shape(inputTensor.get_shape());
                        }
                        copy_tensor_data(requestTensor, inputTensor);
                    }
                }

                if (useGpuMem) {
                    auto outputTensors =
                        ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
                    for (auto& output : compiledModel.outputs()) {
                        inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
                    }
                }
                ++i;
            }
        }

        // warming up - out of scope
        auto inferRequest = inferRequestsQueue.get_idle_request();
        if (!inferRequest) {
            throw ov::Exception("No idle Infer Requests!");
        }

        if (!inferenceOnly) {
            auto inputs = app_inputs_info[0];

            for (auto& item : inputs) {
                auto inputName = item.first;
                const auto& data = inputsData.at(inputName)[0];
                inferRequest->set_tensor(inputName, data);
            }

            if (useGpuMem) {
                auto outputTensors =
                    ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
                for (auto& output : compiledModel.outputs()) {
                    inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
                }
            }
        }

        if (FLAGS_api == "sync") {
            inferRequest->infer();
        } else {
            inferRequest->start_async();
        }

        inferRequestsQueue.wait_all();

        auto duration_ms = inferRequestsQueue.get_latencies()[0];
        slog::info << "First inference took " << double_to_string(duration_ms) << " ms" << slog::endl;

        if (statistics) {
            statistics->add_parameters(
                StatisticsReport::Category::EXECUTION_RESULTS,
                {StatisticsVariant("first inference time (ms)", "first_inference_time", duration_ms)});
        }
        inferRequestsQueue.reset_times();

        size_t processedFramesN = 0;
        auto startTime = Time::now();
        auto execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();

        /** Start inference & calculate performance **/
        /** to align number of iterations to guarantee that last infer requests are
         * executed in the same conditions **/
        ProgressBar progressBar(progressBarTotalCount, FLAGS_stream_output, FLAGS_progress);
        while ((niter != 0LL && iteration < niter) ||
               (duration_nanoseconds != 0LL && (uint64_t)execTime < duration_nanoseconds) ||
               (FLAGS_api == "async" && iteration % nireq != 0)) {
            inferRequest = inferRequestsQueue.get_idle_request();
            if (!inferRequest) {
                throw ov::Exception("No idle Infer Requests!");
            }

            if (!inferenceOnly) {
                auto inputs = app_inputs_info[iteration % app_inputs_info.size()];

                if (FLAGS_pcseq) {
                    inferRequest->set_latency_group_id(iteration % app_inputs_info.size());
                }

                if (isDynamicNetwork) {
                    batchSize = get_batch_size(inputs);
                    if (!std::any_of(inputs.begin(),
                                     inputs.end(),
                                     [](const std::pair<const std::string, benchmark_app::InputInfo>& info) {
                                         return ov::layout::has_batch(info.second.layout);
                                     })) {
                        slog::warn
                            << "No batch dimension was found, asssuming batch to be 1. Beware: this might affect "
                               "FPS calculation."
                            << slog::endl;
                    }
                }

                for (auto& item : inputs) {
                    auto inputName = item.first;
                    const auto& data = inputsData.at(inputName)[iteration % inputsData.at(inputName).size()];
                    inferRequest->set_tensor(inputName, data);
                }

                if (useGpuMem) {
                    auto outputTensors =
                        ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
                    for (auto& output : compiledModel.outputs()) {
                        inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
                    }
                }
            }

            if (FLAGS_api == "sync") {
                inferRequest->infer();
            } else {
                // As the inference request is currently idle, the wait() adds no
                // additional overhead (and should return immediately). The primary
                // reason for calling the method is exception checking/re-throwing.
                // The callback that governs the actual execution can handle errors as
                // well, but as it uses just error codes it has no details like the `what()`
                // method of `std::exception`. So, rechecking for any exceptions here.
                inferRequest->wait();
                inferRequest->start_async();
            }
            ++iteration;

            execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();
            processedFramesN += batchSize;

            if (niter > 0) {
                progressBar.add_progress(1);
            } else {
                // calculate how many progress intervals are covered by current
                // iteration. depends on the current iteration time and time of each
                // progress interval. Previously covered progress intervals must be
                // skipped.
                auto progressIntervalTime = duration_nanoseconds / progressBarTotalCount;
                size_t newProgress = execTime / progressIntervalTime - progressCnt;
                progressBar.add_progress(newProgress);
                progressCnt += newProgress;
            }
        }

        // wait the latest inference executions
        inferRequestsQueue.wait_all();

        LatencyMetrics generalLatency(inferRequestsQueue.get_latencies(), "", FLAGS_latency_percentile);
        std::vector<LatencyMetrics> groupLatencies = {};
        if (FLAGS_pcseq && app_inputs_info.size() > 1) {
            const auto& lat_groups = inferRequestsQueue.get_latency_groups();
            for (int i = 0; i < lat_groups.size(); i++) {
                const auto& lats = lat_groups[i];

                std::string data_shapes_string = "";
                for (auto& item : app_inputs_info[i]) {
                    data_shapes_string += item.first + get_shape_string(item.second.dataShape) + ",";
                }
                data_shapes_string =
                    data_shapes_string == "" ? "" : data_shapes_string.substr(0, data_shapes_string.size() - 1);

                groupLatencies.emplace_back(lats, data_shapes_string, FLAGS_latency_percentile);
            }
        }

        double totalDuration = inferRequestsQueue.get_duration_in_milliseconds();
        double fps = (FLAGS_api == "sync") ? batchSize * 1000.0 / generalLatency.median_or_percentile
                                           : 1000.0 * processedFramesN / totalDuration;

        if (statistics) {
            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
                                       {StatisticsVariant("total execution time (ms)", "execution_time", totalDuration),
                                        StatisticsVariant("total number of iterations", "iterations_num", iteration)});
            if (device_name.find("MULTI") == std::string::npos) {
                std::string latency_label;
                if (FLAGS_latency_percentile == 50) {
                    latency_label = "Median latency (ms)";
                } else {
                    latency_label = "latency (" + std::to_string(FLAGS_latency_percentile) + " percentile) (ms)";
                }
                statistics->add_parameters(
                    StatisticsReport::Category::EXECUTION_RESULTS,
                    {StatisticsVariant(latency_label, "latency_median", generalLatency.median_or_percentile),
                     StatisticsVariant("Percentile boundary", "percentile_boundary", FLAGS_latency_percentile),
                     StatisticsVariant("Average latency (ms)", "latency_avg", generalLatency.avg),
                     StatisticsVariant("Min latency (ms)", "latency_min", generalLatency.min),
                     StatisticsVariant("Max latency (ms)", "latency_max", generalLatency.max)});

                if (FLAGS_pcseq && app_inputs_info.size() > 1) {
                    for (size_t i = 0; i < groupLatencies.size(); ++i) {
                        statistics->add_parameters(
                            StatisticsReport::Category::EXECUTION_RESULTS_GROUPPED,
                            {StatisticsVariant("Group Latencies", "group_latencies", groupLatencies[i])});
                    }
                }
            }
            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
                                       {StatisticsVariant("throughput", "throughput", fps)});
        }
        progressBar.finish();

        // ----------------- 11. Dumping statistics report
        // -------------------------------------------------------------
        next_step();

        if (!FLAGS_dump_config.empty()) {
            dump_config(FLAGS_dump_config, config);
            slog::info << "OpenVINO Runtime configuration settings were dumped to " << FLAGS_dump_config << slog::endl;
        }

        if (!FLAGS_exec_graph_path.empty()) {
            try {
                ov::serialize(compiledModel.get_runtime_model(), FLAGS_exec_graph_path);
                slog::info << "executable graph is stored to " << FLAGS_exec_graph_path << slog::endl;
            } catch (const std::exception& ex) {
                slog::err << "Can't get executable graph: " << ex.what() << slog::endl;
            }
        }

        if (perf_counts) {
            std::vector<std::vector<ov::ProfilingInfo>> perfCounts;
            for (size_t ireq = 0; ireq < nireq; ireq++) {
                auto reqPerfCounts = inferRequestsQueue.requests[ireq]->get_performance_counts();
                if (FLAGS_pc) {
                    slog::info << "Performance counts for " << ireq << "-th infer request:" << slog::endl;
                    printPerformanceCounts(reqPerfCounts, std::cout, getFullDeviceName(core, FLAGS_d), false);
                }
                perfCounts.push_back(reqPerfCounts);
            }
            if (statistics) {
                statistics->dump_performance_counters(perfCounts);
            }
        }

        if (statistics)
            statistics->dump();

        // Performance metrics report
        slog::info << "Count:      " << iteration << " iterations" << slog::endl;
        slog::info << "Duration:   " << double_to_string(totalDuration) << " ms" << slog::endl;
        if (device_name.find("MULTI") == std::string::npos) {
            slog::info << "Latency: " << slog::endl;
            generalLatency.write_to_slog();

            if (FLAGS_pcseq && app_inputs_info.size() > 1) {
                slog::info << "Latency for each data shape group:" << slog::endl;
                for (size_t i = 0; i < app_inputs_info.size(); ++i) {
                    slog::info << (i + 1) << ".";
                    for (auto& item : app_inputs_info[i]) {
                        std::stringstream input_shape;
                        auto shape = item.second.dataShape;
                        std::copy(shape.begin(), shape.end() - 1, std::ostream_iterator<size_t>(input_shape, ","));
                        input_shape << shape.back();
                        slog::info << " " << item.first << " : " << get_shape_string(item.second.dataShape);
                    }
                    slog::info << slog::endl;

                    groupLatencies[i].write_to_slog();
                }
            }
        }
        slog::info << "Throughput: " << double_to_string(fps) << " FPS" << slog::endl;

    } catch (const std::exception& ex) {
        slog::err << ex.what() << slog::endl;

        if (statistics) {
            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
                                       {StatisticsVariant("error", "error", ex.what())});
            statistics->dump();
        }

        return 3;
    }

    return 0;
}
-												Update year to 2022 in copyright notice (#9755)


											
										
										
											2022-01-19 01:07:49 +03:00
+								// Copyright (C) 2018-2022 Intel Corporation
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								// SPDX-License-Identifier: Apache-2.0
 								//
 								#include <algorithm>
 								#include <chrono>
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								#include <map>
 								#include <memory>
 								#include <string>
 								#include <utility>
 								#include <vector>
-												ov2.0 IE samples modification (#8340)

* ov2.0 IE samples modification

apply code style

turn off clang style check for headers order

unify samples a bit

add yuv nv12 reader to format_reader, helloe_nv112 sample

hello_reshape_ssd ov2.0

* sync with PR 8629 preprocessing api changes

* fix for slog << vector<int>

* add operator<< for ov::Version from PR-8687

* Update samples/cpp/hello_nv12_input_classification/main.cpp

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>

* apply code style

* change according to review comments

* add const qualifier

* apply code style

* std::ostream for old inference engine version to make VPU plugin tests happy

* apply code style

* revert changes in print version for old api samples

* keep inference_engine.hpp for not ov2.0 yet samples

* fix merge artifacts

* fix compilation

* apply code style

* Fixed classification sample test

* Revert changes in hello_reshape_ssd sample

* rebase to master, sync with PR-9054

* fix issues found by C++ tests

* rebased and sync with PR-9051

* fix test result parsers for classification tests (except unicode one)

* fix mismatches after merge

* rebase and sync with PR-9144

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>
Co-authored-by: antonrom23 <anton.romanov@intel.com>
											
										
										
											2021-12-13 11:30:58 +03:00
 								// clang-format off
-												[IE Samples][OV2.0] final clean up of old API headers (#9494)

* final clean up of old API headers, compile_tool separated from samples

* make cpplint happy
											
										
										
											2022-01-13 11:12:20 +03:00
+								#include "openvino/openvino.hpp"
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								#include "openvino/pass/serialize.hpp"
-												ov2.0 IE samples modification (#8340)

* ov2.0 IE samples modification

apply code style

turn off clang style check for headers order

unify samples a bit

add yuv nv12 reader to format_reader, helloe_nv112 sample

hello_reshape_ssd ov2.0

* sync with PR 8629 preprocessing api changes

* fix for slog << vector<int>

* add operator<< for ov::Version from PR-8687

* Update samples/cpp/hello_nv12_input_classification/main.cpp

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>

* apply code style

* change according to review comments

* add const qualifier

* apply code style

* std::ostream for old inference engine version to make VPU plugin tests happy

* apply code style

* revert changes in print version for old api samples

* keep inference_engine.hpp for not ov2.0 yet samples

* fix merge artifacts

* fix compilation

* apply code style

* Fixed classification sample test

* Revert changes in hello_reshape_ssd sample

* rebase to master, sync with PR-9054

* fix issues found by C++ tests

* rebased and sync with PR-9051

* fix test result parsers for classification tests (except unicode one)

* fix mismatches after merge

* rebase and sync with PR-9144

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>
Co-authored-by: antonrom23 <anton.romanov@intel.com>
											
										
										
											2021-12-13 11:30:58 +03:00
 								#include "gna/gna_config.hpp"
 								#include "gpu/gpu_config.hpp"
 								#include "samples/args_helper.hpp"
 								#include "samples/common.hpp"
 								#include "samples/slog.hpp"
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								#include "benchmark_app.hpp"
 								#include "infer_request_wrap.hpp"
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								#include "inputs_filling.hpp"
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								#include "progress_bar.hpp"
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								#include "remote_tensors_filling.hpp"
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								#include "statistics_report.hpp"
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								#include "utils.hpp"
-												ov2.0 IE samples modification (#8340)

* ov2.0 IE samples modification

apply code style

turn off clang style check for headers order

unify samples a bit

add yuv nv12 reader to format_reader, hello_nv12 sample

hello_reshape_ssd ov2.0

* sync with PR 8629 preprocessing api changes

* fix for slog << vector<int>

* add operator<< for ov::Version from PR-8687

* Update samples/cpp/hello_nv12_input_classification/main.cpp

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>

* apply code style

* change according to review comments

* add const qualifier

* apply code style

* std::ostream for old inference engine version to make VPU plugin tests happy

* apply code style

* revert changes in print version for old api samples

* keep inference_engine.hpp for not ov2.0 yet samples

* fix merge artifacts

* fix compilation

* apply code style

* Fixed classification sample test

* Revert changes in hello_reshape_ssd sample

* rebase to master, sync with PR-9054

* fix issues found by C++ tests

* rebased and sync with PR-9051

* fix test result parsers for classification tests (except unicode one)

* fix mismatches after merge

* rebase and sync with PR-9144

Co-authored-by: Mikhail Nosov <mikhail.nosov@intel.com>
Co-authored-by: antonrom23 <anton.romanov@intel.com>
											
										
										
											2021-12-13 11:30:58 +03:00
+								// clang-format on
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								static const size_t progressBarDefaultTotalCount = 1000;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												ncc build fixes (#10367)

* fix .ncc_style target names

it was breaking configure on system with libclang-12-dev, clang-12,
ninja and cmake 3.17+(ninja complains about duplicate
target). with lower cmake version configure succeeds, but build exits
immediately with error. by replacing ninja with make error becomes
warning(it's still significant, make just skips duplicate rules, i.e.
doesn't check style of some source files, rule duplication is genuine
bug). without libclang-12-dev and clang-12 ENABLE_NCC_STYLE is OFF and
bug is not triggered

* silence uninitialized warning in core_integration

probably it was always initialized before use, but compiler wasn't made
aware of it

* fix function spelling to unbreak code style checks in benchmark_app

* include <thread> for std::this_thread

existing code was relying on namespace pollution by old libstdc++

* replace is_pod with is_standard_layout && is_trivial

is_pod is deprecated, it breaks build on current gcc

Co-authored-by: Serhii Pavlovskyi <spavlovskyi@lohika.com>
Co-authored-by: Ilya Churaev <ilya.churaev@intel.com>
											
										
										
											2022-03-09 12:42:06 +02:00
+								bool parse_and_check_command_line(int argc, char* argv[]) {
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								    // ---------------------------Parsing and validating input
 								    // arguments--------------------------------------
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    slog::info << "Parsing input parameters" << slog::endl;
 								    gflags::ParseCommandLineNonHelpFlags(&argc, &argv, true);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								    if (FLAGS_help || FLAGS_h) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        show_usage();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        showAvailableDevices();
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        return false;
 								    }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    if (FLAGS_m.empty()) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        show_usage();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        throw std::logic_error("Model is required but not set. Please set -m option.");
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Intoduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								    if (FLAGS_latency_percentile > 100 || FLAGS_latency_percentile < 1) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        show_usage();
-												Intoduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								        throw std::logic_error("The percentile value is incorrect. The applicable values range is [1, 100].");
 								    }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    if (FLAGS_api != "async" && FLAGS_api != "sync") {
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        throw std::logic_error("Incorrect API. Please set -api option to `sync` or `async` value.");
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    }
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								    if (!FLAGS_hint.empty() && FLAGS_hint != "throughput" && FLAGS_hint != "tput" && FLAGS_hint != "latency" &&
-												selectdevice returns MULTI:device in cumulative_throughput (#11367)

* selectdevice returns MULTI:device in cumulative_throughput

* load multi with throughput and disable cpu helper in cumulative

* disable cpu helper in cumulative_throughput

* add cumulative to benchmark_app help message

* modify benchmark_app.hpp clang-format
											
										
										
											2022-05-06 12:42:59 +08:00
+								        FLAGS_hint != "cumulative_throughput" && FLAGS_hint != "ctput" && FLAGS_hint != "none") {
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers' comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								        throw std::logic_error("Incorrect performance hint. Please set -hint option to"
-												selectdevice returns MULTI:device in cumulative_throughput (#11367)

* selectdevice returns MULTI:device in cumulative_throughput

* load multi with throughput and disable cpu helper in cumulative

* disable cpu helper in cumulative_throughput

* add cumulative to benchmark_app help message

* modify benchmark_app.hpp clang-format
											
										
										
											2022-05-06 12:42:59 +08:00
+								                               "`throughput`(tput), `latency', 'cumulative_throughput'(ctput) value or 'none'.");
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers' comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								    }
-												[benchmark_app] Separate hint from fine tuning options. (#10919)

* Separate hint from fine tuning options.

* stylefix

* typo fix

* Order is changed
											
										
										
											2022-09-07 09:13:34 +03:00
+								    if (FLAGS_hint != "none" && (FLAGS_nstreams != "" || FLAGS_nthreads != 0 || FLAGS_pin != "")) {
 								        throw std::logic_error("-nstreams, -nthreads and -pin options are fine tune options. To use them you "
 								                               "should explicitely set -hint option to none. This is not OpenVINO limitation "
 								                               "(those options can be used in OpenVINO together), but a benchmark_app UI rule.");
 								    }
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								    if (!FLAGS_report_type.empty() && FLAGS_report_type != noCntReport && FLAGS_report_type != averageCntReport &&
 								        FLAGS_report_type != detailedCntReport) {
 								        std::string err = "only " + std::string(noCntReport) + "/" + std::string(averageCntReport) + "/" +
 								                          std::string(detailedCntReport) +
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                          " report types are supported (invalid -report_type option value)";
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        throw std::logic_error(err);
 								    }
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								    if ((FLAGS_report_type == averageCntReport) && ((FLAGS_d.find("MULTI") != std::string::npos))) {
 								        throw std::logic_error("only " + std::string(detailedCntReport) + " report type is supported for MULTI device");
 								    }
-												Update benchmark_app to pass precision via command line (#4318)

* Update benchmark_app to pass precision via command line

* Update vpu_perfcheck

* Update python benchmark_app to support setting precision from cmd

* Review comments

* Address more review comments

* Fixes after rebase
											
										
										
											2021-03-26 15:07:59 +03:00
+								    bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
 								    bool isPrecisionSet = !(FLAGS_ip.empty() && FLAGS_op.empty() && FLAGS_iop.empty());
 								    if (isNetworkCompiled && isPrecisionSet) {
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								        std::string err = std::string("Cannot set precision for a compiled network. ") +
 								                          std::string("Please re-compile your network with required precision "
 								                                      "using compile_tool");
-												Update benchmark_app to pass precision via command line (#4318)

* Update benchmark_app to pass precision via command line

* Update vpu_perfcheck

* Update python benchmark_app to support setting precision from cmd

* Review comments

* Address more review comments

* Fixes after rebase
											
										
										
											2021-03-26 15:07:59 +03:00
 								        throw std::logic_error(err);
 								    }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    return true;
 								}
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								static void next_step(const std::string additional_info = "") {
 								    static size_t step_id = 0;
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								    static const std::map<size_t, std::string> step_names = {
 								        {1, "Parsing and validating input arguments"},
-												DOCS: ported changes from 2022.1 release branch (#11206)

* Extensibility guide with FE extensions and remove OV_FRAMEWORK_MAP from docs

* Rework of Extensibility Intro, adopted examples to missing OPENVINO_FRAMEWORK_MAP

* Removed OPENVINO_FRAMEWORK_MAP reference

* Frontend extension detailed documentation

* Fixed distributed snippets

* Fixed snippet inclusion in FE extension document and chapter headers

* Fixed wrong name in a snippet reference

* Fixed test for template extension due to changed number of loaded extensions

* Update docs/Extensibility_UG/frontend_extensions.md

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* Minor fixes in extension snippets

* Small grammar fix

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* DOCS: transition banner (#10973)

* transition banner

* minor fix

* update transition banner

* updates

* update custom.js

* updates

* updates

* Documentation fixes (#11044)

* Benchmark app usage

* Fixed link to the devices

* More fixes

* Update docs/OV_Runtime_UG/multi_device.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Removed several hardcoded links

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Updated documentation for compile_tool (#11049)

* Added deployment guide (#11060)

* Added deployment guide

* Added local distribution

* Updates

* Fixed more indentations

* Removed obsolete code snippets (#11061)

* Removed obsolete code snippets

* NCC style

* Fixed NCC for BA

* Add a troubleshooting issue for PRC installation (#11074)

* updates

* adding gna to linux

* add missing reference

* update

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* update

* minor updates

* add gna item to yum and apt

* add gna to get started page

* update reference formatting

* merge commit

* add a troubleshooting issue

* update

* update

* fix CVS-71846

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* DOCS: fixed hardcoded links  (#11100)

* Fixes

* Use links

* applying reviewers comments to the Opt Guide (#11093)

* applying reviewers' comments

* fixed refs, more structuring (bold, bullets, etc)

* refactoring tput/latency sections

* next iteration (mostly latency), also brushed the auto-batching and other sections

* updates sync/async images

* common opts brushed

* WIP tput redesigned

* minor brushing of common and auto-batching

* Tput fully refactored

* fixed doc name in the link

* moved int8 perf counters to the right section

* fixed links

* fixed broken quotes

* fixed more links

* add ref to the internals to the TOC

* Added a note on the batch size

Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>

* [80085] New images for docs (#11114)

* change doc structure

* fix manager tools

* fix manager tools 3 step

* fix manager tools 3 step

* new img

* new img for OV Runtime

* fix steps

* steps

* fix intendents

* change list

* fix space

* fix space

* code snippets fix

* change display

* Benchmarks 2022 1 (#11130)

* Minor fixes

* Updates for 2022.1

* Edits according to the review

* Edits according to review comments

* Edits according to review comments

* Edits according to review comments

* Fixed table

* Edits according to review comments

* Removed config for Intel® Core™ i7-11850HE

* Removed forward-tacotron-duration-prediction-241 graph

* Added resnet-18-pytorch

* Add info about Docker images in Deployment guide (#11136)

* Renamed user guides (#11137)

* fix screenshot (#11140)

* More conservative recommendations on dynamic shapes usage in docs (#11161)

* More conservative recommendations about using dynamic shapes

* Duplicated statement from C++ part to Python part of reshape doc (no semantical changes)

* Update ShapeInference.md (#11168)

* Benchmarks 2022 1 updates (#11180)

* Updated graphs

* Quick fix for TODO in Dynamic Shapes article

* Anchor link fixes

* Fixed DM config (#11199)

* DOCS: doxy sphinxtabs (#11027)

* initial implementation of doxy sphinxtabs

* fixes

* fixes

* fixes

* fixes

* fixes

* WA for ignored visibility attribute

* Fixes

Co-authored-by: Sergey Lyalin <sergey.lyalin@intel.com>
Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>
Co-authored-by: Nikolay Tyukaev <nikolay.tyukaev@intel.com>
Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>
Co-authored-by: Yuan Xu <yuan1.xu@intel.com>
Co-authored-by: Maxim Shevtsov <maxim.y.shevtsov@intel.com>
Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>
Co-authored-by: Tatiana Savina <tatiana.savina@intel.com>
Co-authored-by: Ilya Naumov <ilya.naumov@intel.com>
Co-authored-by: Evgenya Stepyreva <evgenya.stepyreva@intel.com>
											
										
										
											2022-03-24 22:27:29 +03:00
+								        {2, "Loading OpenVINO Runtime"},
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								        {3, "Setting device configuration"},
 								        {4, "Reading network files"},
 								        {5, "Resizing network to match image sizes and given batch"},
 								        {6, "Configuring input of the model"},
 								        {7, "Loading the model to the device"},
 								        {8, "Setting optimal runtime parameters"},
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        {9, "Creating infer requests and preparing input blobs with data"},
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								        {10, "Measuring performance"},
 								        {11, "Dumping statistics report"}};
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
 								    step_id++;
-												Removed old headers from OV 2.0 API (#12214)

* Removed old headers from OV 2.0 API

* Fixed clang

* Fixed warning

* Updated OMZ submodule

* Fixed gpu tests build
											
										
										
											2022-08-12 11:35:36 +04:00
 								    OPENVINO_ASSERT(step_names.count(step_id) != 0,
 								                    "Step ID ",
 								                    step_id,
 								                    " is out of total steps number ",
 								                    step_names.size());
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
 								    std::cout << "[Step " << step_id << "/" << step_names.size() << "] " << step_names.at(step_id)
 								              << (additional_info.empty() ? "" : " (" + additional_info + ")") << std::endl;
 								}
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								ov::hint::PerformanceMode get_performance_hint(const std::string& device, const ov::Core& core) {
 								    ov::hint::PerformanceMode ov_perf_hint = ov::hint::PerformanceMode::UNDEFINED;
 								    auto supported_properties = core.get_property(device, ov::supported_properties);
 								    if (std::find(supported_properties.begin(), supported_properties.end(), ov::hint::performance_mode) !=
 								        supported_properties.end()) {
 								        if (FLAGS_hint != "") {
 								            if (FLAGS_hint == "throughput" || FLAGS_hint == "tput") {
 								                slog::warn << "Device(" << device << ") performance hint is set to THROUGHPUT" << slog::endl;
 								                ov_perf_hint = ov::hint::PerformanceMode::THROUGHPUT;
 								            } else if (FLAGS_hint == "latency") {
 								                slog::warn << "Device(" << device << ") performance hint is set to LATENCY" << slog::endl;
 								                ov_perf_hint = ov::hint::PerformanceMode::LATENCY;
-												selectdevice returns MULTI:device in cumulative_throughput (#11367)

* selectdevice returns MULTI:device in cumulative_throughput

* load multi with throughput and disable cpu helper in cumulative

* disable cpu helper in cumulative_throughput

* add cumulative to benchmark_app help message

* modify benchmark_app.hpp clang-format
											
										
										
											2022-05-06 12:42:59 +08:00
+								            } else if (FLAGS_hint == "cumulative_throughput" || FLAGS_hint == "ctput") {
 								                slog::warn << "Device(" << device << ") performance hint is set to CUMULATIVE_THROUGHPUT" << slog::endl;
 								                ov_perf_hint = ov::hint::PerformanceMode::CUMULATIVE_THROUGHPUT;
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								            } else if (FLAGS_hint == "none") {
 								                slog::warn << "No device(" << device << ") performance hint is set" << slog::endl;
 								                ov_perf_hint = ov::hint::PerformanceMode::UNDEFINED;
 								            }
 								        } else {
-												Set Latency performance mode in case of sync mode. (#10516)


											
										
										
											2022-02-21 18:08:05 +03:00
+								            ov_perf_hint =
 								                FLAGS_api == "sync" ? ov::hint::PerformanceMode::LATENCY : ov::hint::PerformanceMode::THROUGHPUT;
 								            slog::warn << "Performance hint was not explicitly specified in command line. "
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								                          "Device("
-												Set Latency performance mode in case of sync mode. (#10516)


											
										
										
											2022-02-21 18:08:05 +03:00
+								                       << device << ") performance hint will be set to " << ov_perf_hint << "." << slog::endl;
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								        }
 								    } else {
 								        if (FLAGS_hint != "") {
 								            slog::warn << "Device(" << device << ") does not support performance hint property(-hint)." << slog::endl;
 								        }
 								    }
 								    return ov_perf_hint;
 								}
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								/**
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								 * @brief The entry point of the benchmark application
 								 */
 								int main(int argc, char* argv[]) {
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								    std::shared_ptr<StatisticsReport> statistics;
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								    try {
-												Removed ov::runtime namespace (#9781)

* Removed ov::runtime namespace

* clang-format

* Fixes

* template reference

* Fixes
											
										
										
											2022-01-20 16:17:57 +03:00
+								        ov::CompiledModel compiledModel;
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // ----------------- 1. Parsing and validating input arguments
 								        // -------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												ncc build fixes (#10367)

* fix .ncc_style target names

it was breaking configure on system with libclang-12-dev, clang-12,
ninja and cmake 3.17+(ninja complains about duplicate
target). with lower cmake version configure succeeds, but build exits
immediately with error. by replacing ninja with make error becomes
warning(it's still significant, make just skips duplicate rules, i.e.
doesn't check style of some source files, rule duplication is genuine
bug). without libclang-12-dev and clang-12 ENABLE_NCC_STYLE is OFF and
bug is not triggered

* silence uninitialized warning in core_integration

probably it was always initialized before use, but compiler wasn't made
aware of it

* fix function spelling to unbreak code style checks in benchmark_app

* include <thread> for std::this_thread

existing code was relying on namespace pollution by old libstdc++

* replace is_pod with is_standard_layout && is_trivial

is_pod is deprecated, it breaks build on current gcc

Co-authored-by: Serhii Pavlovskyi <spavlovskyi@lohika.com>
Co-authored-by: Ilya Churaev <ilya.churaev@intel.com>
											
										
										
											2022-03-09 12:42:06 +02:00
+								        if (!parse_and_check_command_line(argc, argv)) {
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								            return 0;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        }
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								        bool isNetworkCompiled = fileExt(FLAGS_m) == "blob";
 								        if (isNetworkCompiled) {
 								            slog::info << "Network is compiled" << slog::endl;
 								        }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        std::vector<gflags::CommandLineFlagInfo> flags;
 								        StatisticsReport::Parameters command_line_arguments;
 								        gflags::GetAllFlags(&flags);
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        for (auto& flag : flags) {
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            if (!flag.is_default) {
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                command_line_arguments.emplace_back(flag.name, flag.name, flag.current_value);
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								            }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        }
 								        if (!FLAGS_report_type.empty()) {
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            statistics = FLAGS_json_stats ? std::make_shared<StatisticsReportJSON>(
 								                                                StatisticsReport::Config{FLAGS_report_type, FLAGS_report_folder})
 								                                          : std::make_shared<StatisticsReport>(
 								                                                StatisticsReport::Config{FLAGS_report_type, FLAGS_report_folder});
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            statistics->add_parameters(StatisticsReport::Category::COMMAND_LINE_PARAMETERS, command_line_arguments);
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								        }
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        auto isFlagSetInCommandLine = [&command_line_arguments](const std::string& name) {
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								            return (std::find_if(command_line_arguments.begin(),
 								                                 command_line_arguments.end(),
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                                 [name](const StatisticsVariant& p) {
 								                                     return p.json_name == name;
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								                                 }) != command_line_arguments.end());
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        };
 								        std::string device_name = FLAGS_d;
 								        // Parse devices
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        auto devices = parse_devices(device_name);
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        // Parse nstreams per device
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review comments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								        std::map<std::string, std::string> device_nstreams = parse_value_per_device(devices, FLAGS_nstreams);
 								        std::map<std::string, std::string> device_infer_precision =
 								            parse_value_per_device(devices, FLAGS_infer_precision);
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
 								        // Load device config file if specified
-												OV 2.0 c++ configuration API (#9870)

* New configuration API

* Review fix

* review comments

* fixed device name map

* fixed header

* code style

* fixed optimization capabilities

* flatten properties

* dox fix

* doc

* merge conflicts

* fixed merge conflicts

* Fixed subobject linkage warning

* format fix

* Fixed unity test build

* Merge conflict fixes

* Fixed variadic
											
										
										
											2022-01-25 12:43:56 +03:00
+								        std::map<std::string, ov::AnyMap> config;
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        if (!FLAGS_load_config.empty()) {
 								            load_config(FLAGS_load_config, config);
 								        }
-												[IE Samples] json configuration reader and dumper for benchmark_app (#9648)

* added load_config and dump_config functions implemented with json library

* add warning, upd readme

* Update samples/cpp/benchmark_app/README.md

Co-authored-by: Fedor Zharinov <fedor.zharinov@intel.com>

Co-authored-by: Fedor Zharinov <fedor.zharinov@intel.com>
											
										
										
											2022-01-18 11:22:47 +03:00
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        /** This vector stores paths to the processed images with input names**/
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        auto inputFiles = parse_input_arguments(gflags::GetArgvs());
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												DOCS: ported changes from 2022.1 release branch (#11206)

* Extensibility guide with FE extensions and remove OV_FRAMEWORK_MAP from docs

* Rework of Extensibility Intro, adopted examples to missing OPENVINO_FRAMEWORK_MAP

* Removed OPENVINO_FRAMEWORK_MAP reference

* Frontend extension detailed documentation

* Fixed distributed snippets

* Fixed snippet inclusion in FE extension document and chapter headers

* Fixed wrong name in a snippet reference

* Fixed test for template extension due to changed number of loaded extensions

* Update docs/Extensibility_UG/frontend_extensions.md

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* Minor fixes in extension snippets

* Small grammar fix

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* DOCS: transition banner (#10973)

* transition banner

* minor fix

* update transition banner

* updates

* update custom.js

* updates

* updates

* Documentation fixes (#11044)

* Benchmark app usage

* Fixed link to the devices

* More fixes

* Update docs/OV_Runtime_UG/multi_device.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Removed several hardcoded links

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Updated documentation for compile_tool (#11049)

* Added deployment guide (#11060)

* Added deployment guide

* Added local distribution

* Updates

* Fixed more indentations

* Removed obsolete code snippets (#11061)

* Removed obsolete code snippets

* NCC style

* Fixed NCC for BA

* Add a troubleshooting issue for PRC installation (#11074)

* updates

* adding gna to linux

* add missing reference

* update

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* update

* minor updates

* add gna item to yum and apt

* add gna to get started page

* update reference formatting

* merge commit

* add a troubleshooting issue

* update

* update

* fix CVS-71846

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* DOCS: fixed hardcoded links  (#11100)

* Fixes

* Use links

* applying reviewers comments to the Opt Guide (#11093)

* applying reviewers' comments

* fixed refs, more structuring (bold, bullets, etc)

* refactoring tput/latency sections

* next iteration (mostly latency), also brushed the auto-batching and other sections

* updates sync/async images

* common opts brushed

* WIP tput redesigned

* minor brushing of common and auto-batching

* Tput fully refactored

* fixed doc name in the link

* moved int8 perf counters to the right section

* fixed links

* fixed broken quotes

* fixed more links

* add ref to the internals to the TOC

* Added a note on the batch size

Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>

* [80085] New images for docs (#11114)

* change doc structure

* fix manager tools

* fix manager tools 3 step

* fix manager tools 3 step

* new img

* new img for OV Runtime

* fix steps

* steps

* fix indents

* change list

* fix space

* fix space

* code snippets fix

* change display

* Benchmarks 2022 1 (#11130)

* Minor fixes

* Updates for 2022.1

* Edits according to the review

* Edits according to review comments

* Edits according to review comments

* Edits according to review comments

* Fixed table

* Edits according to review comments

* Removed config for Intel® Core™ i7-11850HE

* Removed forward-tacotron-duration-prediction-241 graph

* Added resnet-18-pytorch

* Add info about Docker images in Deployment guide (#11136)

* Renamed user guides (#11137)

* fix screenshot (#11140)

* More conservative recommendations on dynamic shapes usage in docs (#11161)

* More conservative recommendations about using dynamic shapes

* Duplicated statement from C++ part to Python part of reshape doc (no semantical changes)

* Update ShapeInference.md (#11168)

* Benchmarks 2022 1 updates (#11180)

* Updated graphs

* Quick fix for TODO in Dynamic Shapes article

* Anchor link fixes

* Fixed DM config (#11199)

* DOCS: doxy sphinxtabs (#11027)

* initial implementation of doxy sphinxtabs

* fixes

* fixes

* fixes

* fixes

* fixes

* WA for ignored visibility attribute

* Fixes

Co-authored-by: Sergey Lyalin <sergey.lyalin@intel.com>
Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>
Co-authored-by: Nikolay Tyukaev <nikolay.tyukaev@intel.com>
Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>
Co-authored-by: Yuan Xu <yuan1.xu@intel.com>
Co-authored-by: Maxim Shevtsov <maxim.y.shevtsov@intel.com>
Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>
Co-authored-by: Tatiana Savina <tatiana.savina@intel.com>
Co-authored-by: Ilya Naumov <ilya.naumov@intel.com>
Co-authored-by: Evgenya Stepyreva <evgenya.stepyreva@intel.com>
											
										
										
											2022-03-24 22:27:29 +03:00
+								        // ----------------- 2. Loading the OpenVINO Runtime
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // -----------------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Removed ov::runtime namespace (#9781)

* Removed ov::runtime namespace

* clang-format

* Fixes

* template reference

* Fixes
											
										
										
											2022-01-20 16:17:57 +03:00
+								        ov::Core core;
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
-												-l option is replaced with -extensions (#10878)


											
										
										
											2022-04-04 16:08:38 +03:00
+								        if (!FLAGS_extensions.empty()) {
 								            // Extensions are loaded as a shared library
 								            core.add_extension(FLAGS_extensions);
 								            slog::info << "Extensions are loaded: " << FLAGS_extensions << slog::endl;
-												Publishing 2019 R1.1 content and Myriad plugin sources (#162)

* Publishing 2019 R1.1 content and Myriad plugin sources
											
										
										
											2019-05-27 21:18:32 +03:00
+								        }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        // Load clDNN Extensions
-												Publishing 2019 R1.1 content and Myriad plugin sources (#162)

* Publishing 2019 R1.1 content and Myriad plugin sources
											
										
										
											2019-05-27 21:18:32 +03:00
+								        if ((FLAGS_d.find("GPU") != std::string::npos) && !FLAGS_c.empty()) {
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            // Override config if command line parameter is specified
 								            if (!config.count("GPU"))
 								                config["GPU"] = {};
 								            config["GPU"][CONFIG_KEY(CONFIG_FILE)] = FLAGS_c;
 								        }
 								        if (config.count("GPU") && config.at("GPU").count(CONFIG_KEY(CONFIG_FILE))) {
-												OV 2.0 c++ configuration API (#9870)

* New configuration API

* Review fix

* review comments

* fixed device name map

* fixed header

* code style

* fixed optimization capabilities

* flatten properties

* dox fix

* doc

* merge conflicts

* fixed merge conflicts

* Fixed subobject linkage warning

* format fix

* Fixed unity test build

* Merge conflict fixes

* Fixed variadic
											
										
										
											2022-01-25 12:43:56 +03:00
+								            auto ext = config.at("GPU").at(CONFIG_KEY(CONFIG_FILE)).as<std::string>();
 								            core.set_property("GPU", {{CONFIG_KEY(CONFIG_FILE), ext}});
-												-l option is replaced with -extensions (#10878)


											
										
										
											2022-04-04 16:08:38 +03:00
+								            slog::info << "GPU extensions are loaded: " << ext << slog::endl;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								        slog::info << "OpenVINO: " << ov::get_openvino_version() << slog::endl;
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        slog::info << "Device info: " << slog::endl;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								        slog::info << core.get_versions(device_name) << slog::endl;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // ----------------- 3. Setting device configuration
 								        // -----------------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												[GPU] Add separate config for each device (#7421)


											
										
										
											2021-10-19 16:51:38 +03:00
+								        auto getDeviceTypeFromName = [](std::string device) -> std::string {
 								            return device.substr(0, device.find_first_of(".("));
 								        };
 								        // Set default values from dumped config
 								        std::set<std::string> default_devices;
 								        for (auto& device : devices) {
 								            auto default_config = config.find(getDeviceTypeFromName(device));
 								            if (default_config != config.end()) {
 								                if (!config.count(device)) {
 								                    config[device] = default_config->second;
 								                    default_devices.emplace(default_config->first);
 								                }
 								            }
 								        }
 								        for (auto& device : default_devices) {
 								            config.erase(device);
 								        }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        bool perf_counts = false;
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark failing to pass on MULTI device when num_streams is enabled.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plugin will not check if the unsupported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices by using ov::device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								        // check if using the virtual device
 								        auto if_auto = std::find(devices.begin(), devices.end(), "AUTO") != devices.end();
 								        auto if_multi = std::find(devices.begin(), devices.end(), "MULTI") != devices.end();
 								        // Remove the hardware devices if AUTO/MULTI appears in the devices list.
 								        if (if_auto || if_multi) {
 								            devices.clear();
 								            std::string virtual_device;
 								            if (if_auto) {
 								                virtual_device = "AUTO";
 								                devices.push_back("AUTO");
 								            }
 								            if (if_multi) {
 								                virtual_device = "MULTI";
 								                devices.push_back("MULTI");
 								            }
 								            parse_value_for_virtual_device(virtual_device, device_nstreams);
 								            parse_value_for_virtual_device(virtual_device, device_infer_precision);
 								        }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        // Update config per device according to command line parameters
 								        for (auto& device : devices) {
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review comments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								            auto& device_config = config[device];
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								            // high-level performance modes
-												 Modify for CVS-69023: hint configuration (#10259)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-14 22:46:11 +08:00
+								            auto ov_perf_hint = get_performance_hint(device, core);
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								            if (ov_perf_hint != ov::hint::PerformanceMode::UNDEFINED) {
 								                device_config.emplace(ov::hint::performance_mode(ov_perf_hint));
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								                if (FLAGS_nireq != 0)
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                    device_config.emplace(ov::hint::num_requests(FLAGS_nireq));
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								            }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            // Set performance counter
 								            if (isFlagSetInCommandLine("pc")) {
 								                // set to user defined value
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                device_config.emplace(ov::enable_profiling(FLAGS_pc));
 								            } else if (device_config.count(ov::enable_profiling.name()) &&
 								                       (device_config.at(ov::enable_profiling.name()).as<bool>())) {
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								                slog::warn << "Performance counters for " << device
 								                           << " device is turned on. To print results use -pc option." << slog::endl;
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            } else if (FLAGS_report_type == detailedCntReport || FLAGS_report_type == averageCntReport) {
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								                slog::warn << "Turn on performance counters for " << device << " device since report type is "
 								                           << FLAGS_report_type << "." << slog::endl;
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                device_config.emplace(ov::enable_profiling(true));
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            } else if (!FLAGS_exec_graph_path.empty()) {
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								                slog::warn << "Turn on performance counters for " << device << " device due to execution graph dumping."
 								                           << slog::endl;
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                device_config.emplace(ov::enable_profiling(true));
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            } else {
 								                // set to default value
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                device_config.emplace(ov::enable_profiling(FLAGS_pc));
-												Publishing 2020.2 content

											
										
										
											2020-04-13 21:17:23 +03:00
+								            }
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								            perf_counts = (device_config.at(ov::enable_profiling.name()).as<bool>()) ? true : perf_counts;
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review comments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								            auto supported_properties = core.get_property(device, ov::supported_properties);
 								            auto supported = [&](const std::string& key) {
 								                return std::find(std::begin(supported_properties), std::end(supported_properties), key) !=
 								                       std::end(supported_properties);
 								            };
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers' comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								            // the rest are individual per-device settings (overriding the values set with perf modes)
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            auto setThroughputStreams = [&]() {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                std::string key = getDeviceTypeFromName(device) + "_THROUGHPUT_STREAMS";
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                auto it_device_nstreams = device_nstreams.find(device);
 								                if (it_device_nstreams != device_nstreams.end()) {
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                    // set to user defined value
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                    if (supported(key)) {
 								                        device_config[key] = it_device_nstreams->second;
 								                    } else if (supported(ov::num_streams.name())) {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                        // Use API 2.0 key for streams
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                        key = ov::num_streams.name();
 								                        device_config[key] = it_device_nstreams->second;
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								                    } else if (device == "MULTI" || device == "AUTO") {
 								                        // check if the element contains the hardware device property
 								                        auto value_vec = split(it_device_nstreams->second, ' ');
 								                        if (value_vec.size() == 1) {
 								                            key = ov::num_streams.name();
 								                            device_config[key] = it_device_nstreams->second;
 								                        } else {
 								                            // set device nstreams properties in the AUTO/MULTI plugin
 								                            std::stringstream strm(it_device_nstreams->second);
 								                            std::map<std::string, std::string> devices_property;
 								                            ov::util::Read<std::map<std::string, std::string>>{}(strm, devices_property);
 								                            for (auto it : devices_property) {
 								                                device_config.insert(
 								                                    ov::device::properties(it.first, ov::num_streams(std::stoi(it.second))));
 								                            }
 								                        }
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                    } else {
 								                        throw std::logic_error("Device " + device + " doesn't support config key '" + key + "' " +
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                                               "and '" + ov::num_streams.name() + "'!" +
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                                               "Please specify -nstreams for correct devices in format  "
 								                                               "<dev1>:<nstreams1>,<dev2>:<nstreams2>" +
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                                               " or via configuration file.");
 								                    }
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed chaching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                } else if (ov_perf_hint == ov::hint::PerformanceMode::UNDEFINED && !device_config.count(key) &&
 								                           (FLAGS_api == "async")) {
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                    slog::warn << "-nstreams default value is determined automatically for " << device
 								                               << " device. "
 								                                  "Although the automatic selection usually provides a "
 								                                  "reasonable performance, "
 								                                  "but it still may be non-optimal for some cases, for more "
 								                                  "information look at README."
 								                               << slog::endl;
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                    if (std::string::npos == device.find("MYRIAD")) {  // MYRIAD sets the default number of
 								                                                                       // streams implicitly (without _AUTO)
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                        if (supported(key)) {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                            device_config[key] = std::string(getDeviceTypeFromName(device) + "_THROUGHPUT_AUTO");
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                        } else if (supported(ov::num_streams.name())) {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                            // Use API 2.0 key for streams
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                            key = ov::num_streams.name();
-												Streams  property with special values (#10411)

* Streams  property with special values

* Fixed clang
											
										
										
											2022-02-17 16:39:06 +03:00
+								                            device_config[key] = ov::streams::AUTO;
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                        }
 								                    }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                }
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                auto it_streams = device_config.find(ov::num_streams.name());
 								                if (it_streams != device_config.end())
 								                    device_nstreams[device] = it_streams->second.as<std::string>();
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								            };
-												Publishing 2020.2 content

											
										
										
											2020-04-13 21:17:23 +03:00
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								            auto set_infer_precision = [&] {
 								                // Applies the inference precision the user requested for `device`, if any.
 								                const auto requested = device_infer_precision.find(device);
 								                if (requested == device_infer_precision.end()) {
 								                    // no per-device precision was given: leave device_config untouched
 								                    return;
 								                }
 								                // a user-defined value on a device that lacks the property is reported as an error
 								                const bool has_precision_key = supported(ov::hint::inference_precision.name());
 								                if (!has_precision_key) {
 								                    throw std::logic_error("Device " + device + " doesn't support config key '" +
 								                                           ov::hint::inference_precision.name() + "'! " +
 								                                           "Please specify -infer_precision for correct devices in format  "
 								                                           "<dev1>:<infer_precision1>,<dev2>:<infer_precision2>" +
 								                                           " or via configuration file.");
 								                }
 								                device_config.emplace(ov::hint::inference_precision(requested->second));
 								            };
 								            // Maps the pin values "YES" -> "CORE" and "NO" -> "NONE"; any other value is returned unchanged.
 								            auto fix_pin_option = [](const std::string& str) -> std::string {
 								                if (str == "YES") {
 								                    return "CORE";
 								                }
 								                return str == "NO" ? std::string("NONE") : str;
 								            };
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								            if (supported(ov::inference_num_threads.name()) && isFlagSetInCommandLine("nthreads")) {
 								                device_config.emplace(ov::inference_num_threads(FLAGS_nthreads));
 								            }
 								            if (supported(ov::affinity.name()) && isFlagSetInCommandLine("pin")) {
 								                device_config.emplace(ov::affinity(fix_pin_option(FLAGS_pin)));
 								            }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								            if (device.find("CPU") != std::string::npos || device.find("GPU") != std::string::npos) {
 								                // CPU supports few special performance-oriented keys
 								                // for CPU and GPU execution, more throughput-oriented execution via streams
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                setThroughputStreams();
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review coments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                set_infer_precision();
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								            } else if (device.find("MYRIAD") != std::string::npos) {
 								                device_config.emplace(ov::log::level(ov::log::Level::WARNING));
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								                setThroughputStreams();
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								            } else if (device.find("GNA") != std::string::npos) {
-												[GPU] Support hint::inference_precision (#12526)


											
										
										
											2022-08-15 16:34:36 +04:00
+								                set_infer_precision();
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
+								            } else if (device.find("AUTO") != std::string::npos) {
 								                setThroughputStreams();
 								                set_infer_precision();
 								                device_nstreams.erase(device);
 								            } else if (device.find("MULTI") != std::string::npos) {
 								                setThroughputStreams();
 								                set_infer_precision();
 								                if ((device_name.find("GPU") != std::string::npos) && (device_name.find("CPU") != std::string::npos)) {
-												Set Latency performance mode in case of sync mode. (#10516)


											
										
										
											2022-02-21 18:08:05 +03:00
+								                    slog::warn << "GPU throttling is turned on. Multi-device execution with "
-												Typo fix (#6144)


											
										
										
											2021-06-14 22:47:59 +09:00
+								                                  "the CPU + GPU performs best with GPU throttling hint, "
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                               << "which releases another CPU thread (that is otherwise "
-												Set Latency performance mode in case of sync mode. (#10516)


											
										
										
											2022-02-21 18:08:05 +03:00
+								                                  "used by the GPU driver for active polling)."
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                               << slog::endl;
-												[AUTO plugin] Fix benchmark failed to set nstreams on MULTI plugin (#12855)

* fix benchmark filed to pass on MULTI device when enable num_streams.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove part of test cases because MULTI plguin will not check if the unspported property is valid now.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Remove some incorrect config for MULTI test case since MULTI will pass through those unrecognized config without any exception.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support MULTI to set nstreams to multi target devices by using ov::device:properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Support AUTO to set nstreams with multi target devices bu using ov:device::properties.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-27 23:42:40 +08:00
 								                    device_config.insert(ov::device::properties("GPU", {{GPU_CONFIG_KEY(PLUGIN_THROTTLE), 1}}));
 								                    // limit threading for CPU portion of inference
 								                    if (!isFlagSetInCommandLine("pin")) {
 								                        auto it_affinity = device_config.find(ov::affinity.name());
 								                        if (it_affinity != device_config.end()) {
 								                            slog::warn << "Turn off threads pinning for " << device
 								                                       << " device since multi-scenario with GPU device is used." << slog::endl;
 								                            it_affinity->second = ov::Affinity::NONE;
 								                        }
 								                    }
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								                }
-												[CVS-78727] bug fix for -d AUTO:CPU,GPU the return device should be AUTO only (#10417)

Signed-off-by: xuejun <xuejun.zhai@intel.com>
											
										
										
											2022-02-18 14:56:56 +08:00
+								                device_nstreams.erase(device);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        for (auto&& item : config) {
-												OV 2.0 c++ configuration API (#9870)

* New configuration API

* Review fix

* review coments

* fixed device name map

* fixed header

* code stile

* fixed optimization capabilities

* flatten properties

* dox fix

* doc

* merge conflicts

* fixed merge conflicts

* Fixed subobject linkage warning

* foramt fix

* Fixed unity test build

* Merge conflict fixes

* Fixed variadic
											
										
										
											2022-01-25 12:43:56 +03:00
+								            core.set_property(item.first, item.second);
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        }
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								        size_t batchSize = FLAGS_b;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								        ov::element::Type type = ov::element::undefined;
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								        std::string topology_name = "";
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        std::vector<benchmark_app::InputsInfo> app_inputs_info;
-												Adds support of user layouts to benchmark_app (#4002)

* Adds support of user layouts to benchmark_app

* Keep snake_case for python

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2021-02-11 12:57:05 +03:00
+								        std::string output_name;
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
 								        // Takes priority over config from file
 								        if (!FLAGS_cache_dir.empty()) {
-												New configuration API in set get property (#10012)

* New configuration API in set|get property

* removed supported metrics and keys

* Fixed build

* Fixed build

* Fixed samples build

* Fixed samples build

* Fixed build

* Removed old properties in plugin

* Fixed build
											
										
										
											2022-02-01 13:05:14 +03:00
+								            core.set_property(ov::cache_dir(FLAGS_cache_dir));
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
+								        }
-												[Benchmark] benchmark_app need disable auto batching if batch size is set.  (#12553)

* When set batch_size, disable auto batching

* auto-batch only supports auto plugin

* Set property allow_auto_batching for devices

* cancel static

* Clean Code

* Add test case for testing allow_auto_batching

* Fix the issue after merging latest master branch code

* Add allow_auto_batching in python benchmark_app

* Fix the quotes issue

* When load_network is set to allow-auto-batching, there is no need to read the value of global

* Fix the clang-format

* Change the location

Co-authored-by: River Li <river.li@intel.com>
Co-authored-by: Chen Peter <peter.chen@intel.com>
											
										
										
											2022-09-22 09:50:30 +08:00
+								        // If set batch size, disable the auto batching
 								        if (FLAGS_b > 0) {
 								            core.set_property(ov::hint::allow_auto_batching(false));
 								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        bool isDynamicNetwork = false;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
+								        if (FLAGS_load_from_file && !isNetworkCompiled) {
 								            next_step();
 								            slog::info << "Skipping the step for loading network from file" << slog::endl;
 								            next_step();
 								            slog::info << "Skipping the step for loading network from file" << slog::endl;
 								            next_step();
 								            slog::info << "Skipping the step for loading network from file" << slog::endl;
 								            auto startTime = Time::now();
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            compiledModel = core.compile_model(FLAGS_m, device_name);
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            auto duration_ms = get_duration_ms_till_now(startTime);
 								            slog::info << "Load network took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												[benchmark_app]Show network original I/O info (#10694)

* Show network original I/O info

* additional no-name case check

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
											
										
										
											2022-03-21 13:57:56 +03:00
+								            slog::info << "Original network I/O parameters:" << slog::endl;
 								            printInputAndOutputsInfoShort(compiledModel);
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
+								            if (statistics)
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                statistics->add_parameters(
 								                    StatisticsReport::Category::EXECUTION_RESULTS,
 								                    {StatisticsVariant("load network time (ms)", "load_network_time", duration_ms)});
-												Benchmark_app: Command line args processing is modified to use both tensor and corresponding node names (#9968)

* Node/name conversions

* stylefix
											
										
										
											2022-02-01 16:05:00 +03:00
 								            convert_io_names_in_map(inputFiles, compiledModel.inputs());
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            app_inputs_info = get_inputs_info(FLAGS_shape,
 								                                              FLAGS_layout,
 								                                              batchSize,
 								                                              FLAGS_data_shape,
 								                                              inputFiles,
 								                                              FLAGS_iscale,
 								                                              FLAGS_imean,
 								                                              compiledModel.inputs());
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
+								            if (batchSize == 0) {
 								                batchSize = 1;
 								            }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
-												[Caching] Add caching options to benchmark app (#4909)

* Python API for LoadNetwork by model file name

* BenchmarkApp: Add caching and LoadNetworkFromFile support

    2 new options are introduced
    - cache_dir <dir> - enables models caching
    - load_from_file - use new perform "LoadNetwork" by model file name

    Using both parameters will achieve maximum performance of read/load network on startup

    Tests:
    1) Run "benchmark_app -h". Help will display 2 new options. After available devices there will be list of devices with cache support
    2) ./benchmark_app -d CPU -i <model.xml> -load_from_file
    Verify that some test steps are skipped (related to ReadNetwork, re-shaping etc)
    3) Pre-requisite: support of caching shall be enabled for Template plugin
    ./benchmark_app -d TEMPLATE -i <model.onnx> -load_from_file -cache_dir someDir
    Verify that "someDir" is created and generated blob is available
    Run again, verify that loading works as well (should be faster as it will not load onnx model)
    4) Run same test as (3), but without -load_from_file option. Verify that cache is properly created
    For some devices loadNetwork time shall be improved when cache is available

* Removed additional timing prints

* Correction from old code

* Revert "Removed additional timing prints"

Additional change - when .blob is chosen instead of .xml, it takes priority over caching flags

* Removed new time printings

As discussed, these time measurements like 'total first inference time' will be available in 'timeTests' scripts

* Fix clang-format issues
											
										
										
											2021-05-17 13:41:15 +03:00
+								        } else if (!isNetworkCompiled) {
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            // ----------------- 4. Reading the Intermediate Representation network
 								            // ----------------------------------------
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            next_step();
 								            slog::info << "Loading network files" << slog::endl;
 								            auto startTime = Time::now();
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            auto model = core.read_model(FLAGS_m);
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            auto duration_ms = get_duration_ms_till_now(startTime);
 								            slog::info << "Read network took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												[benchmark_app]Show network original I/O info (#10694)

* Show network original I/O info

* additional no-name case check

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
											
										
										
											2022-03-21 13:57:56 +03:00
+								            slog::info << "Original network I/O parameters:" << slog::endl;
 								            printInputAndOutputsInfoShort(*model);
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            if (statistics)
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                statistics->add_parameters(
 								                    StatisticsReport::Category::EXECUTION_RESULTS,
 								                    {StatisticsVariant("read network time (ms)", "read_network_time", duration_ms)});
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            const auto& inputInfo = std::const_pointer_cast<const ov::Model>(model)->inputs();
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            if (inputInfo.empty()) {
 								                throw std::logic_error("no inputs info is provided");
 								            }
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            // ----------------- 5. Resizing network to match image sizes and given
 								            // batch ----------------------------------
-												[CPU] OneDNN 2.6 migration (#11627)

* Migrate on OneDNN 2.7

* [CPU] Enabled brconv implementation

* Post ops optimizations

* [CPU] Enabled I8 precision on activations for Convolution node

* [CPU][WA] Disabled Deconvolution + post ops fusing optimization

* Fixed FQ post op optimization

* [CPU] Optimize post ops processing

* [WA] Add node name if tensor names are empty

* [WA] remove layout compatibility check that leads to the false-positive exceptions

* [CPU] Optimize processing for FQ + Sum + FQ post ops pattern

* [CPU][WA] Enabled ReduceSum -> AvgPool transformation due to perf issues

* fix compiler error

* rebase onednn master

* cherry pick from 2.7 to 2.6

* [WA] make cpu case to run completed

* fix xmm zero check

* reopen 'FuseDeconvolutionAndSimpleOperation' Transform  to fix CPU 'ConvolutionBackpropDataLayerTest' fail issue

* [WR] Removed the failing ReduceMean tests caused by 21f3555.

* group deconv may crash on memory out of bound

* [WA] Remove the moc fail case by #af4731a1

* testcase conv maxpool will check brgconv instead of jit

* test subgraph added nhwc format check

* fix gemm bf16 win crash

* fix avx2 groupconv accuracy problem

* [WA] remove invalid FQ tests

* WR to disable the LPT multiplyToGroupConv test because the  transformation was disabled in d5e16f

* add gemm int8 binary postops to fix GroupConvolutionQDqTransformation fail

* add gemm int8 binary postops to fix GroupConvolutionQDqTransformation fail

* fix gemm bf16 fail

* Fix ConcatConvSumInPlaceTest

* Add cpuDebugFuncTests target

* [WA] bf16 crash due to MemoryInput/Output

* OVClassBasicTest case typo

* testcase subgraph sets default ENFORCE_BF16 to NO

* fix clang check

* Fix primType check issue

* Fix cpplint error

* MemoryInput/Output support bf16; Enforce bf16 'NO' should enable snippets

* disable BF16 fusing fakequant testcase

* testcase init support amx check

* testcase for conv brgconv avx512/amx

* testcase for conv brgconv avx512/amx

* WR enforce reorder bug and add NSPC into deconv supported list.

* Compiling issue fix.

* [WA] skip fakequantize fusing in bf16

* mix legacy/new binary postops

* make nightly case run. tested on amx/avx512/avx2.

* [CPU] Add BF16 AMX test for Matmul

* Add CPU dump check tool

* Add verbose log

* Generate exec graph in cpu dump check tool

* fix binary prelu post Ops

* fix cpplint

* Update ONEDNN version to fix AVX2 bug.

* cpu dump check supports compare dump files

* Add a new CPU_DEBUG_CAPS: OV_CPU_SUMMARY_PERF

* change VERBOSE_LOG to DEBUG_LOG

* fix oneDNN register_jit_code log

* fix cpplint

* Add OV_CPU_DEBUG_LOG controls debug logs to show

* Revert reorder WR.

* Enhanced CPU debug logs and breakpoint support

* Enhanced cpu_dump_check with --ports

* Fix DEBUG_LOG compile issue

* GroupDeconvolutionLayerCPUTest extend to add amx test cases

* Add Node into DEBUG_LOG

* cpu_dump_check: Dump results even no port is specified

* Fix MergeTransposeAndReorder for blocked input

* Fix cpu_dump_check result names

* Enhance DEBUG_LOG on edges

* Cpu dump check support shape mismatch

* Fix bi-directional inplace

* Cpu dump check support inference_precision_hint f32.

* fix windows dump fail.

* fix depthwise nwc conv

* add rtol arg

* win debugbreak

* fix pooling accuracy

* GroupDeconvolutionLayerCPUTest remove invalid test param for nspc

* recover ov onednn fork

* revert af4731a1f1e085f959d2612b656b50f75c0fbc98 '[WA] remove layout compatibility chheck'

* [WA] disable avx2 conv3d fusing case

* [WA] disable avx2 conv3d fusing case

* [WA] Disabled weights md transpose in FC to prevent perf degradations

Co-authored-by: dmitrygo <dmitry.gorokhov@intel.com>
Co-authored-by: Vladislav Golubev <vladislav.golubev@intel.com>
Co-authored-by: Zhang Yi3 <yi3.zhang@intel.com>
Co-authored-by: liubo-intel <bo4.liu@intel.com>
Co-authored-by: Luwei Zhou <luwei.zhou@intel.com>
Co-authored-by: Li, Tingqian <tingqian.li@intel.com>
Co-authored-by: xuchen-intel <chen.xu@intel.com>
Co-authored-by: ceciliapeng2011 <cecilia.peng@intel.com>
											
										
										
											2022-06-06 18:30:32 +08:00
+								            for (auto& item : model->inputs()) {
 								                if (item.get_tensor().get_names().empty()) {
 								                    item.get_tensor_ptr()->set_names(
 								                        std::unordered_set<std::string>{item.get_node_shared_ptr()->get_name()});
 								                }
 								            }
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            next_step();
-												Benchmark_app: Command line args processing is modified to use both tensor and corresponding node names (#9968)

* Node/name conversions

* stylefix
											
										
										
											2022-02-01 16:05:00 +03:00
+								            convert_io_names_in_map(inputFiles, std::const_pointer_cast<const ov::Model>(model)->inputs());
-												publish master branch snapshot, revision 49482ae3bea0cbaa07474f86f36db11943142687

											
										
										
											2020-05-13 21:12:22 +03:00
+								            // Parse input shapes if specified
 								            bool reshape = false;
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            app_inputs_info = get_inputs_info(FLAGS_shape,
 								                                              FLAGS_layout,
 								                                              FLAGS_b,
 								                                              FLAGS_data_shape,
 								                                              inputFiles,
 								                                              FLAGS_iscale,
 								                                              FLAGS_imean,
 								                                              inputInfo,
 								                                              reshape);
-												publish master branch snapshot, revision 49482ae3bea0cbaa07474f86f36db11943142687

											
										
										
											2020-05-13 21:12:22 +03:00
+								            if (reshape) {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                benchmark_app::PartialShapes shapes = {};
 								                for (auto& item : app_inputs_info[0])
 								                    shapes[item.first] = item.second.partialShape;
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                slog::info << "Reshaping network: " << get_shapes_string(shapes) << slog::endl;
-												publish master branch snapshot, revision 49482ae3bea0cbaa07474f86f36db11943142687

											
										
										
											2020-05-13 21:12:22 +03:00
+								                startTime = Time::now();
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                model->reshape(shapes);
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                duration_ms = get_duration_ms_till_now(startTime);
 								                slog::info << "Reshape network took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												publish master branch snapshot, revision 49482ae3bea0cbaa07474f86f36db11943142687

											
										
										
											2020-05-13 21:12:22 +03:00
+								                if (statistics)
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                    statistics->add_parameters(
 								                        StatisticsReport::Category::EXECUTION_RESULTS,
 								                        {StatisticsVariant("reshape network time (ms)", "reshape_network_time", duration_ms)});
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
 								            // ----------------- 6. Configuring inputs and outputs
 								            // ----------------------------------------------------------------------
 								            next_step();
 								            auto preproc = ov::preprocess::PrePostProcessor(model);
-												OV 2.0 c++ configuration API (#9870)

* New configuration API

* Review fix

* review comments

* fixed device name map

* fixed header

* code style

* fixed optimization capabilities

* flatten properties

* dox fix

* doc

* merge conflicts

* fixed merge conflicts

* Fixed subobject linkage warning

* format fix

* Fixed unity test build

* Merge conflict fixes

* Fixed variadic
											
										
										
											2022-01-25 12:43:56 +03:00
+								            std::map<std::string, std::string> user_precisions_map;
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
+								            if (!FLAGS_iop.empty()) {
 								                user_precisions_map = parseArgMap(FLAGS_iop);
-												Benchmark_app: Command line args processing is modified to use both tensor and corresponding node names (#9968)

* Node/name conversions

* stylefix
											
										
										
											2022-02-01 16:05:00 +03:00
+								                convert_io_names_in_map(user_precisions_map,
 								                                        std::const_pointer_cast<const ov::Model>(model)->inputs(),
 								                                        std::const_pointer_cast<const ov::Model>(model)->outputs());
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
+								            }
 								            const auto input_precision = FLAGS_ip.empty() ? ov::element::undefined : getPrecision2(FLAGS_ip);
 								            const auto output_precision = FLAGS_op.empty() ? ov::element::undefined : getPrecision2(FLAGS_op);
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								            const auto& inputs = model->inputs();
 								            for (int i = 0; i < inputs.size(); i++) {
 								                const auto& item = inputs[i];
 								                auto iop_precision = ov::element::undefined;
 								                auto type_to_set = ov::element::undefined;
 								                std::string name;
 								                try {
 								                    // Some tensors might have no names, get_any_name will throw exception in that case.
 								                    // -iop option will not work for those tensors.
 								                    name = item.get_any_name();
 								                    iop_precision = getPrecision2(user_precisions_map.at(item.get_any_name()));
 								                } catch (...) {
 								                }
 								                if (iop_precision != ov::element::undefined) {
 								                    type_to_set = iop_precision;
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
+								                } else if (input_precision != ov::element::undefined) {
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								                    type_to_set = input_precision;
-												set U8 precision for image-like inputs even in case of random filling (#10140)


											
										
										
											2022-02-07 12:09:16 +03:00
+								                } else if (!name.empty() && app_inputs_info[0].at(name).is_image()) {
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    // image input, set U8
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								                    type_to_set = ov::element::u8;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                }
-												[Benchmark] Fixed preprocessing inputs (#10022)


											
										
										
											2022-01-31 17:05:44 +03:00
+								                auto& in = preproc.input(item.get_any_name());
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								                if (type_to_set != ov::element::undefined) {
 								                    in.tensor().set_element_type(type_to_set);
 								                    if (!name.empty()) {
 								                        for (auto& info : app_inputs_info) {
 								                            info.at(name).type = type_to_set;
 								                        }
 								                    }
-												Fix for Layout and image_info related issues (#10258)

* bugfix78627

* stylefix

* fix
											
										
										
											2022-02-17 00:42:51 +03:00
+								                }
 								                // Explicitly set inputs layout.
 								                if (!name.empty() && !app_inputs_info[0].at(name).layout.empty()) {
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								                    in.model().set_layout(app_inputs_info[0].at(name).layout);
 								                }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            }
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								            const auto& outs = model->outputs();
 								            for (int i = 0; i < outs.size(); i++) {
 								                const auto& item = outs[i];
 								                auto iop_precision = ov::element::undefined;
 								                try {
 								                    // Some tensors might have no names, get_any_name will throw exception in that case.
 								                    // -iop option will not work for those tensors.
 								                    iop_precision = getPrecision2(user_precisions_map.at(item.get_any_name()));
 								                } catch (...) {
 								                }
 								                if (iop_precision != ov::element::undefined) {
 								                    preproc.output(i).tensor().set_element_type(iop_precision);
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
+								                } else if (output_precision != ov::element::undefined) {
-												Benchmarkapp: Added processing of inputs/outputs by index (#9703)

* Added processing of inputs/outputs by index

* fix

* All tensor's get_friendly_name are replaced with get_any_name

* stylefix
											
										
										
											2022-01-18 13:40:54 +03:00
+								                    preproc.output(i).tensor().set_element_type(output_precision);
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
+								                }
 								            }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            model = preproc.build();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								            // Check if network has dynamic shapes
 								            auto input_info = app_inputs_info[0];
 								            isDynamicNetwork = std::any_of(input_info.begin(),
 								                                           input_info.end(),
 								                                           [](const std::pair<std::string, benchmark_app::InputInfo>& i) {
 								                                               return i.second.partialShape.is_dynamic();
 								                                           });
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            topology_name = model->get_friendly_name();
-												Benchmark_app batch calculation fix (#9554)

* BenchmarkApp - batch size calculation fix

* stylefix

* -ip/op fix

* stylefix
											
										
										
											2022-01-13 23:34:38 +03:00
 								            // Calculate batch size according to provided layout and shapes (static case)
 								            if (!isDynamicNetwork && app_inputs_info.size()) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                batchSize = get_batch_size(app_inputs_info.front());
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                slog::info << "Network batch size: " << batchSize << slog::endl;
 								            } else if (batchSize == 0) {
 								                batchSize = 1;
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            }
-												Update benchmark_app to pass precision via command line (#4318)

* Update benchmark_app to pass precision via command line

* Update vpu_perfcheck

* Update python benchmark_app to support setting precision from cmd

* Review comments

* Address more review comments

* Fixes after rebase
											
										
										
											2021-03-26 15:07:59 +03:00
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            printInputAndOutputsInfoShort(*model);
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            // ----------------- 7. Loading the model to the device
 								            // --------------------------------------------------------
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            next_step();
 								            startTime = Time::now();
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								            compiledModel = core.compile_model(model, device_name);
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            duration_ms = get_duration_ms_till_now(startTime);
 								            slog::info << "Load network took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            if (statistics)
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                statistics->add_parameters(
 								                    StatisticsReport::Category::EXECUTION_RESULTS,
 								                    {StatisticsVariant("load network time (ms)", "load_network_time", duration_ms)});
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								        } else {
 								            next_step();
 								            slog::info << "Skipping the step for compiled network" << slog::endl;
 								            next_step();
 								            slog::info << "Skipping the step for compiled network" << slog::endl;
 								            next_step();
 								            slog::info << "Skipping the step for compiled network" << slog::endl;
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            // ----------------- 7. Loading the model to the device
 								            // --------------------------------------------------------
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            next_step();
 								            auto startTime = Time::now();
-												Compiled network loading is fixed (#9547)

* compiled network loading is fixed

* StyleFix
											
										
										
											2022-01-10 23:37:46 +03:00
-												Fix for benchmark_app: set model stream flags (#9609)


											
										
										
											2022-01-13 10:15:33 +03:00
+								            std::ifstream modelStream(FLAGS_m, std::ios_base::binary | std::ios_base::in);
-												Compiled network loading is fixed (#9547)

* compiled network loading is fixed

* StyleFix
											
										
										
											2022-01-10 23:37:46 +03:00
+								            if (!modelStream.is_open()) {
 								                throw std::runtime_error("Cannot open model file " + FLAGS_m);
 								            }
 								            compiledModel = core.import_model(modelStream, device_name, {});
 								            modelStream.close();
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            auto duration_ms = get_duration_ms_till_now(startTime);
 								            slog::info << "Import network took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												[benchmark_app]Show network original I/O info (#10694)

* Show network original I/O info

* additional no-name case check

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
											
										
										
											2022-03-21 13:57:56 +03:00
+								            slog::info << "Original network I/O paramteters:" << slog::endl;
 								            printInputAndOutputsInfoShort(compiledModel);
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            if (statistics)
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                statistics->add_parameters(
 								                    StatisticsReport::Category::EXECUTION_RESULTS,
 								                    {StatisticsVariant("import network time (ms)", "import_network_time", duration_ms)});
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
-												Benchmark_app: Command line args processing is modified to use both tensor and corresponding node names (#9968)

* Node/name conversions

* stylefix
											
										
										
											2022-02-01 16:05:00 +03:00
+								            convert_io_names_in_map(inputFiles, compiledModel.inputs());
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            app_inputs_info = get_inputs_info(FLAGS_shape,
 								                                              FLAGS_layout,
 								                                              FLAGS_b,
 								                                              FLAGS_data_shape,
 								                                              inputFiles,
 								                                              FLAGS_iscale,
 								                                              FLAGS_imean,
 								                                              compiledModel.inputs());
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								            if (batchSize == 0) {
 								                batchSize = 1;
 								            }
 								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								        if (isDynamicNetwork && FLAGS_api == "sync") {
 								            throw std::logic_error("Benchmarking of the model with dynamic shapes is available for async API only."
 								                                   "Please use -api async -nstreams 1 -nireq 1 to emulate sync behavior");
 								        }
 								        // Defining of benchmark mode
 								        // for static models inference only mode is used as default one
 								        bool inferenceOnly = FLAGS_inference_only;
 								        if (isDynamicNetwork) {
 								            if (isFlagSetInCommandLine("inference_only") && inferenceOnly && app_inputs_info.size() != 1) {
 								                throw std::logic_error(
 								                    "Dynamic models with different input data shapes must be benchmarked only in full mode.");
 								            }
 								            inferenceOnly = isFlagSetInCommandLine("inference_only") && inferenceOnly && app_inputs_info.size() == 1;
 								        }
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers' comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								        // ----------------- 8. Querying optimal runtime parameters
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // -----------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												Enable THROUGHPUT by default for all the devices. (#9107)

* Set THROUGHPUT as the default configuration for all the plugins and display the config of the plugin.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* updated format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update benchmark python API.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Replace str 'THROUGHPUT' with CONFIG_VALUE(THROUGHPUT).

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Using CONFIG_VALUE(THROUGHPUT) replace 'THROUGHPUT' string.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* update code style.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Move the setting output code into the try block.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
											
										
										
											2022-01-12 16:09:54 +08:00
+								        // output of the actual settings that the device selected
 								        for (const auto& device : devices) {
-												[AUTOPLUGIN] OV config 2.0 support  (#10191)

* add support for LOG_LEVEL and supported_properties

Signed-off-by: Hu, Yuan2 <yuan2.hu@intel.com>

* fix compile error

Signed-off-by: Hu, Yuan2 <yuan2.hu@intel.com>

* add test case for log_level and full_name

Signed-off-by: Hu, Yuan2 <yuan2.hu@intel.com>

* update to ov 2.0

Signed-off-by: fishbell <bell.song@intel.com>

* fix benchmark_app failure for AUTO:GPU, GPU

Signed-off-by: Hu, Yuan2 <yuan2.hu@intel.com>

* add case

Signed-off-by: fishbell <bell.song@intel.com>

* refine logic

Signed-off-by: fishbell <bell.song@intel.com>

* add test cases

Signed-off-by: fishbell <bell.song@intel.com>

* add more cases

Signed-off-by: fishbell <bell.song@intel.com>

* fix redefinition

Signed-off-by: fishbell <bell.song@intel.com>

* cpu plugin only in cpu tests

Signed-off-by: fishbell <bell.song@intel.com>

* typo in parameter

Signed-off-by: fishbell <bell.song@intel.com>

* use _core directly

Signed-off-by: fishbell <bell.song@intel.com>

* fix multi case failure

Signed-off-by: fishbell <bell.song@intel.com>

Co-authored-by: fishbell <bell.song@intel.com>
											
										
										
											2022-02-11 23:39:09 +08:00
+								            auto supported_properties = compiledModel.get_property(ov::supported_properties);
-												Enable THROUGHPUT by default for all the devices. (#9107)

* Set THROUGHPUT as the default configration for all the plugin and display the config of the plugin.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* updated format.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Update benchmark python API.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Replace str 'THROUGHPUT' with CONFIG_VALUE(THROUGHPUT).

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Using CONFIG_VALUE(THROUGHPUT) replace 'THROUGHPUT' string.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* update code style.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>

* Move the setting output code into the try block.

Signed-off-by: Wang, Yang <yang4.wang@intel.com>
											
										
										
											2022-01-12 16:09:54 +08:00
+								            slog::info << "Device: " << device << slog::endl;
-												New configuration API in set get property (#10012)

* New configuration API in set|get property

* removed supported metrics and keys

* Fixed build

* Fixed build

* Fixed samples build

* Fixed samples build

* Fixed build

* Removed old properties in plugin

* Fixed build
											
										
										
											2022-02-01 13:05:14 +03:00
+								            for (const auto& cfg : supported_properties) {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								                try {
 								                    if (cfg == ov::supported_properties)
 								                        continue;
 								                    auto prop = compiledModel.get_property(cfg);
 								                    slog::info << "  { " << cfg << " , " << prop.as<std::string>() << " }" << slog::endl;
 								                } catch (const ov::Exception&) {
 								                }
-												OV Performance Hints (CPU and GPU logic for selecting the actual configs), while AUTO/MULTI are passing them thru) (#6993)

* rebasing the perf-modes-2021.3 to the 2021.4

Caveats:
the (explicit) setting #streams is not disabled (as it was before for experiments with DLBenchmark), and the logic slightly differs (streamsSet)

(cherry picked from commit 1ae1edc0ed70fdea40f528fdaf8d00a9904d2a5c)

* overriding streams (to force the TPUT mode to the DLBenchmark)

(cherry picked from commit 7f506cda31abf35ac293d0dce32f602a0188c619)

* disabling reducing #streams to fully mimic baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments)

(cherry picked from commit 85073dd1dd2c7d43a89c37c8f646313f6ddfc650)

* clang/indentation

(cherry picked from commit 050a4155a923cee294c8689d685b39247b7a172a)

* splitting the Transformation to general and CPU specific.

Now hopefully, this fully mimics the baseline c4df94d42d90a2bc3cd91d3d6844ba42f29bca7f of the 2021.3 (before experiments), as the streams reduce num (as well as early exit on GRU/LSTM/TensorIterator) is disabled

(cherry picked from commit e98b2c1a67f2542a686543594b75b575ef515196)

* disabling GRU/LSTM/TI + reducing of streams + 5D considered compute-limited only for int8

(cherry picked from commit 32b8d80dee18685ebf3d069bb4cd2172af7363b7)

* refactored to avoid compute_limited_ratio, reverted the reducing #streams, removed LSTM from limitations

(cherry picked from commit f2b972171b29cf599aae2407ceec2e6adb67e4e9)

* isa-based threshold logic

(cherry picked from commit b218457e1a93fcb3374eb9da948fdad2175ec33a)

* mode->hint

(cherry picked from commit ec20aa8ecaf3222f2a6fdfe9153cf6c9dfdd6a54)

* optional PERFORMANCE_HINT_NUM_REQUESTS

(cherry picked from commit 5a3883e3f36e7928c6391094ae10711c8e4c3b5c)

* moving the perfHints to the common OV config class + initial tests (CPU only, as the actual AUTO/MULTI should be accommodated on the master)

(cherry picked from commit (then fixed)45bafe7d527f466507dea0693aeed51be4ebf776)

* AUTO support for PerfHints

* MULTI support for PerfHints

* Enabling Perf hints for the GPU plugin

* brushing settings output a bit

* disabling "throughput" perf hint being default (until OV 2.0)

* uncommenting the logic which was disabled to force the DLBenchmark to use the throughput mode by default

* removing dead and experimental code, and debug printfs

* clang/code-style

* code-review remarks

* Moved the output of the actual params that the hint produced to the right place

* aligning MULTI's GetConfig beh to HETERO's as captured in the preso (CVS-59960) ratified with the ArchForum

* clang

* benchmark_app brushing

* Update inference-engine/samples/benchmark_app/README.md

* propagating the perf hints thru one more scenario in the merged AUTO-MULTI

* fixed misprint

* Python benchmark_app update for perf hints

* addressing reviewers' comments on the python benchmark_app

* simplifying/brushing logic a bit

* refactor the heuristic to the separate file (to be shared with iGPU soon)

* refactor conversion of modes to the specific GPU config per feedback from Vladimir
											
										
										
											2021-09-13 15:40:36 +03:00
+								            }
 								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        // Update number of streams
 								        for (auto&& ds : device_nstreams) {
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								            try {
 								                const std::string key = getDeviceTypeFromName(ds.first) + "_THROUGHPUT_STREAMS";
 								                device_nstreams[ds.first] = core.get_property(ds.first, key).as<std::string>();
 								            } catch (const ov::Exception&) {
-												Used new config for streams and threads (#10150)

* Used new config for streams and threads

* Fixed review comments in ba

* format fix

* fixed hello_query_device

* Added STL string io

* fixed tests

* Fixed test

* Fixed build

* fixed format

* Fixed build

* try fix win

* other any io specialization

* Fixed after merge

* renamed streams

* build fixed

* fixed build

* fixed format

* fix for old mac build

* Fixed type of exception

* test fix
											
										
										
											2022-02-11 09:22:45 +03:00
+								                device_nstreams[ds.first] = core.get_property(ds.first, ov::num_streams.name()).as<std::string>();
-												[GPU] Add new properties and fix bechmark_app (#10149)


											
										
										
											2022-02-09 09:18:54 +03:00
+								            }
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        // Number of requests
 								        uint32_t nireq = FLAGS_nireq;
 								        if (nireq == 0) {
-												Publishing 2020.2 content

											
										
										
											2020-04-13 21:17:23 +03:00
+								            if (FLAGS_api == "sync") {
 								                nireq = 1;
 								            } else {
 								                try {
-												PERF_COUNT replaced with ov::enable_profiling (#10118)

* String conversions in any

* Fixed caching tests

* Fixed tests

* fixed build

* PERF_COUNT replaced with ov::enable_profiling

* fixed format

* fixed format

* fixed optimal config

* merge fix

* fix build

* format fix

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
											
										
										
											2022-02-05 13:27:46 +03:00
+								                    nireq = compiledModel.get_property(ov::optimal_number_of_infer_requests);
-												Simplified IE Exceptions Implementation (#4258)


											
										
										
											2021-03-18 16:30:16 +03:00
+								                } catch (const std::exception& ex) {
-												Removed old headers from OV 2.0 API (#12214)

* Removed old headers from OV 2.0 API

* Fixed clang

* Fixed warning

* Updated OMZ submodule

* Fixed gpu tests build
											
										
										
											2022-08-12 11:35:36 +04:00
+								                    throw ov::Exception("Every device used with the benchmark_app should support " +
 								                                        std::string(ov::optimal_number_of_infer_requests.name()) +
 								                                        " Failed to query the metric for the " + device_name +
 								                                        " with error:" + ex.what());
-												Publishing 2020.2 content

											
										
										
											2020-04-13 21:17:23 +03:00
+								                }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								            }
 								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        // Iteration limit
 								        uint32_t niter = FLAGS_niter;
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        size_t shape_groups_num = app_inputs_info.size();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        if ((niter > 0) && (FLAGS_api == "async")) {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            if (shape_groups_num > nireq) {
 								                niter = ((niter + shape_groups_num - 1) / shape_groups_num) * shape_groups_num;
 								                if (FLAGS_niter != niter) {
 								                    slog::warn << "Number of iterations was aligned by data shape groups number from " << FLAGS_niter
 								                               << " to " << niter << " using number of possible input shapes " << shape_groups_num
 								                               << slog::endl;
 								                }
 								            } else {
 								                niter = ((niter + nireq - 1) / nireq) * nireq;
 								                if (FLAGS_niter != niter) {
 								                    slog::warn << "Number of iterations was aligned by request number from " << FLAGS_niter << " to "
 								                               << niter << " using number of requests " << nireq << slog::endl;
 								                }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            }
-												Publishing R5 content (#72)

* Publishing R5 content

* Updated ade revision

* updated readme

* add possibility to build CPU plugin with Intel MKL package

											
										
										
											2019-01-21 21:31:31 +03:00
+								        }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        // Time limit
 								        uint32_t duration_seconds = 0;
 								        if (FLAGS_t != 0) {
 								            // time limit
 								            duration_seconds = FLAGS_t;
 								        } else if (FLAGS_niter == 0) {
 								            // default time limit
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            duration_seconds = device_default_device_duration_in_seconds(device_name);
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        }
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        uint64_t duration_nanoseconds = get_duration_in_nanoseconds(duration_seconds);
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								        if (statistics) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            statistics->add_parameters(
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								                StatisticsReport::Category::RUNTIME_CONFIG,
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                StatisticsReport::Parameters(
 								                    {StatisticsVariant("benchmark mode", "benchmark_mode", inferenceOnly ? "inference only" : "full"),
 								                     StatisticsVariant("topology", "topology", topology_name),
 								                     StatisticsVariant("target device", "target_device", device_name),
 								                     StatisticsVariant("API", "api", FLAGS_api),
 								                     StatisticsVariant("precision", "precision", type.get_type_name()),
 								                     StatisticsVariant("batch size", "batch_size", batchSize),
 								                     StatisticsVariant("number of iterations", "iterations_num", niter),
 								                     StatisticsVariant("number of parallel infer requests", "nireq", nireq),
 								                     StatisticsVariant("duration (ms)", "duration", get_duration_in_milliseconds(duration_seconds))}));
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								            for (auto& nstreams : device_nstreams) {
 								                std::stringstream ss;
 								                ss << "number of " << nstreams.first << " streams";
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
 								                std::string dev_name = nstreams.first;
 								                std::transform(dev_name.begin(), dev_name.end(), dev_name.begin(), [](unsigned char c) {
 								                    return c == ' ' ? '_' : std::tolower(c);
 								                });
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                statistics->add_parameters(StatisticsReport::Category::RUNTIME_CONFIG,
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                                           {StatisticsVariant(ss.str(), dev_name + "_streams_num", nstreams.second)});
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								            }
 								        }
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // ----------------- 9. Creating infer requests and filling input blobs
 								        // ----------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								        InferRequestsQueue inferRequestsQueue(compiledModel, nireq, app_inputs_info.size(), FLAGS_pcseq);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								        bool inputHasName = false;
 								        if (inputFiles.size() > 0) {
 								            inputHasName = inputFiles.begin()->first != "";
 								        }
 								        bool newInputType = isDynamicNetwork || inputHasName;
 								        // create vector to store remote input blobs buffer
 								        std::vector<::gpu::BufferType> clInputsBuffer;
 								        bool useGpuMem = false;
-												Removed ov::runtime namespace (#9781)

* Removed ov::runtime namespace

* clang-format

* Fixes

* template reference

* Fixes
											
										
										
											2022-01-20 16:17:57 +03:00
+								        std::map<std::string, ov::TensorVector> inputsData;
-												Add `use_device_mem` option to benchmark_app (#7433)


											
										
										
											2021-09-17 11:04:50 +03:00
+								        if (isFlagSetInCommandLine("use_device_mem")) {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            if (device_name.find("GPU") == 0) {
-												creating remote ocl buffer/tensor per request, to avoid simulteneous locking of the same ocl buffer when auto-batching is used (#10607)


											
										
										
											2022-02-28 15:04:03 +03:00
+								                inputsData = ::gpu::get_remote_input_tensors(inputFiles,
 								                                                             app_inputs_info,
 								                                                             compiledModel,
 								                                                             clInputsBuffer,
 								                                                             inferRequestsQueue.requests.size());
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                useGpuMem = true;
 								            } else if (device_name.find("CPU") == 0) {
 								                if (newInputType) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    inputsData = get_tensors(inputFiles, app_inputs_info);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                } else {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    inputsData = get_tensors_static_case(
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                        inputFiles.empty() ? std::vector<std::string>{} : inputFiles.begin()->second,
 								                        batchSize,
 								                        app_inputs_info[0],
 								                        nireq);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
 								            } else {
-												Removed old headers from OV 2.0 API (#12214)

* Removed old headers from OV 2.0 API

* FIxed clang

* Fixed warning

* Updated OMZ submodule

* Fixed gpu tests build
											
										
										
											2022-08-12 11:35:36 +04:00
+								                throw ov::Exception("Requested device doesn't support `use_device_mem` option.");
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            }
-												Add `use_device_mem` option to benchmark_app (#7433)


											
										
										
											2021-09-17 11:04:50 +03:00
+								        } else {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            if (newInputType) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                inputsData = get_tensors(inputFiles, app_inputs_info);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            } else {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                inputsData = get_tensors_static_case(
 								                    inputFiles.empty() ? std::vector<std::string>{} : inputFiles.begin()->second,
 								                    batchSize,
 								                    app_inputs_info[0],
 								                    nireq);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            }
-												Add `use_device_mem` option to benchmark_app (#7433)


											
										
										
											2021-09-17 11:04:50 +03:00
+								        }
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // ----------------- 10. Measuring performance
 								        // ------------------------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        size_t progressCnt = 0;
 								        size_t progressBarTotalCount = progressBarDefaultTotalCount;
 								        size_t iteration = 0;
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        std::stringstream ss;
-												Fix spelling errors in samples and documentation (#2795)

* Fix spelling errors in samples

* Fix spelling errors in the documentation
											
										
										
											2020-11-11 15:35:39 +03:00
+								        ss << "Start inference " << FLAGS_api << "hronously";
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        if (FLAGS_api == "async") {
 								            if (!ss.str().empty()) {
 								                ss << ", ";
 								            }
 								            ss << nireq << " inference requests";
 								            std::stringstream device_ss;
 								            for (auto& nstreams : device_nstreams) {
 								                if (!device_ss.str().empty()) {
 								                    device_ss << ", ";
 								                }
 								                device_ss << nstreams.second << " streams for " << nstreams.first;
 								            }
 								            if (!device_ss.str().empty()) {
 								                ss << " using " << device_ss.str();
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								            }
 								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        ss << ", limits: ";
 								        if (duration_seconds > 0) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            ss << get_duration_in_milliseconds(duration_seconds) << " ms duration";
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        if (niter != 0) {
 								            if (duration_seconds == 0) {
 								                progressBarTotalCount = niter;
 								            }
 								            if (duration_seconds > 0) {
 								                ss << ", ";
 								            }
 								            ss << niter << " iterations";
 								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step(ss.str());
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        if (inferenceOnly) {
 								            slog::info << "BENCHMARK IS IN INFERENCE ONLY MODE." << slog::endl;
 								            slog::info << "Input blobs will be filled once before performance measurements." << slog::endl;
 								        } else {
 								            slog::info << "BENCHMARK IS IN FULL MODE." << slog::endl;
 								            slog::info << "Inputs setup stage will be included in performance measurements." << slog::endl;
 								        }
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								        // copy prepared data straight into inferRequest->getTensor()
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        // for inference only mode
 								        if (inferenceOnly) {
 								            if (nireq < inputsData.begin()->second.size())
 								                slog::warn << "Only " << nireq << " test configs will be used." << slog::endl;
 								            size_t i = 0;
 								            for (auto& inferRequest : inferRequestsQueue.requests) {
 								                auto inputs = app_inputs_info[i % app_inputs_info.size()];
 								                for (auto& item : inputs) {
 								                    auto inputName = item.first;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    const auto& inputTensor = inputsData.at(inputName)[i % inputsData.at(inputName).size()];
 								                    // for remote blobs setTensor is used, they are already allocated on the device
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    if (useGpuMem) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        inferRequest->set_tensor(inputName, inputTensor);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    } else {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        auto requestTensor = inferRequest->get_tensor(inputName);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                        if (isDynamicNetwork) {
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                            requestTensor.set_shape(inputTensor.get_shape());
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                        }
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        copy_tensor_data(requestTensor, inputTensor);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    }
 								                }
 								                if (useGpuMem) {
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    auto outputTensors =
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    for (auto& output : compiledModel.outputs()) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    }
 								                }
 								                ++i;
 								            }
 								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        // warming up - out of scope
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        auto inferRequest = inferRequestsQueue.get_idle_request();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        if (!inferRequest) {
-												Removed old headers from OV 2.0 API (#12214)

* Removed old headers from OV 2.0 API

* FIxed clang

* Fixed warning

* Updated OMZ submodule

* Fixed gpu tests build
											
										
										
											2022-08-12 11:35:36 +04:00
+								            throw ov::Exception("No idle Infer Requests!");
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								        if (!inferenceOnly) {
 								            auto inputs = app_inputs_info[0];
 								            for (auto& item : inputs) {
 								                auto inputName = item.first;
 								                const auto& data = inputsData.at(inputName)[0];
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                inferRequest->set_tensor(inputName, data);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            }
 								            if (useGpuMem) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                auto outputTensors =
 								                    ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                for (auto& output : compiledModel.outputs()) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
 								            }
 								        }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        if (FLAGS_api == "sync") {
 								            inferRequest->infer();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        } else {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            inferRequest->start_async();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimeter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg  decsription

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring perfomance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        inferRequestsQueue.wait_all();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image cashing

* added cashed blobs creating

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								        auto duration_ms = inferRequestsQueue.get_latencies()[0];
 								        slog::info << "First inference took " << double_to_string(duration_ms) << " ms" << slog::endl;
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								        if (statistics) {
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            statistics->add_parameters(
 								                StatisticsReport::Category::EXECUTION_RESULTS,
 								                {StatisticsVariant("first inference time (ms)", "first_inference_time", duration_ms)});
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        }
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        inferRequestsQueue.reset_times();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        size_t processedFramesN = 0;
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								        auto startTime = Time::now();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        auto execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();
 								        /** Start inference & calculate performance **/
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        /** to align number of iterations to guarantee that last infer requests are
 								         * executed in the same conditions **/
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        ProgressBar progressBar(progressBarTotalCount, FLAGS_stream_output, FLAGS_progress);
-												Update samples style (#6998)

* Align clang config with IE

* Apply code style

* Update code style for c samples

* Fixed style for c samples
											
										
										
											2021-08-11 14:47:29 +03:00
+								        while ((niter != 0LL && iteration < niter) ||
 								               (duration_nanoseconds != 0LL && (uint64_t)execTime < duration_nanoseconds) ||
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								               (FLAGS_api == "async" && iteration % nireq != 0)) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            inferRequest = inferRequestsQueue.get_idle_request();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            if (!inferRequest) {
-												Removed old headers from OV 2.0 API (#12214)

* Removed old headers from OV 2.0 API

* Fixed clang

* Fixed warning

* Updated OMZ submodule

* Fixed gpu tests build
											
										
										
											2022-08-12 11:35:36 +04:00
+								                throw ov::Exception("No idle Infer Requests!");
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            }
-												Publishing R5 content (#72)

* Publishing R5 content

* Updated ade revision

* updated readme

* add possibility to build CPU plugin with Intel MKL package

											
										
										
											2019-01-21 21:31:31 +03:00
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            if (!inferenceOnly) {
 								                auto inputs = app_inputs_info[iteration % app_inputs_info.size()];
 								                if (FLAGS_pcseq) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    inferRequest->set_latency_group_id(iteration % app_inputs_info.size());
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
 								                if (isDynamicNetwork) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    batchSize = get_batch_size(inputs);
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    if (!std::any_of(inputs.begin(),
 								                                     inputs.end(),
 								                                     [](const std::pair<const std::string, benchmark_app::InputInfo>& info) {
 								                                         return ov::layout::has_batch(info.second.layout);
 								                                     })) {
 								                        slog::warn
 								                            << "No batch dimension was found, asssuming batch to be 1. Beware: this might affect "
 								                               "FPS calculation."
 								                            << slog::endl;
 								                    }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
 								                for (auto& item : inputs) {
 								                    auto inputName = item.first;
 								                    const auto& data = inputsData.at(inputName)[iteration % inputsData.at(inputName).size()];
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                    inferRequest->set_tensor(inputName, data);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
 								                if (useGpuMem) {
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    auto outputTensors =
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        ::gpu::get_remote_output_tensors(compiledModel, inferRequest->get_output_cl_buffer());
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    for (auto& output : compiledModel.outputs()) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        inferRequest->set_tensor(output.get_any_name(), outputTensors[output.get_any_name()]);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    }
 								                }
 								            }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            if (FLAGS_api == "sync") {
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								                inferRequest->infer();
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								            } else {
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                // As the inference request is currently idle, the wait() adds no
 								                // additional overhead (and should return immediately). The primary
 								                // reason for calling the method is exception checking/re-throwing.
 								                // Callback, that governs the actual execution can handle errors as
 								                // well, but as it uses just error codes it has no details like ‘what()’
 								                // method of `std::exception` So, rechecking for any exceptions here.
-												Publishing 2020.1 content

											
										
										
											2020-02-11 22:48:49 +03:00
+								                inferRequest->wait();
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                inferRequest->start_async();
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								            }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            ++iteration;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            execTime = std::chrono::duration_cast<ns>(Time::now() - startTime).count();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            processedFramesN += batchSize;
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            if (niter > 0) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                progressBar.add_progress(1);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            } else {
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								                // calculate how many progress intervals are covered by current
 								                // iteration. depends on the current iteration time and time of each
 								                // progress interval. Previously covered progress intervals must be
 								                // skipped.
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								                auto progressIntervalTime = duration_nanoseconds / progressBarTotalCount;
 								                size_t newProgress = execTime / progressIntervalTime - progressCnt;
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                progressBar.add_progress(newProgress);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								                progressCnt += newProgress;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								            }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        // wait the latest inference executions
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        inferRequestsQueue.wait_all();
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								        LatencyMetrics generalLatency(inferRequestsQueue.get_latencies(), "", FLAGS_latency_percentile);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        std::vector<LatencyMetrics> groupLatencies = {};
 								        if (FLAGS_pcseq && app_inputs_info.size() > 1) {
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            const auto& lat_groups = inferRequestsQueue.get_latency_groups();
 								            for (int i = 0; i < lat_groups.size(); i++) {
 								                const auto& lats = lat_groups[i];
 								                std::string data_shapes_string = "";
 								                for (auto& item : app_inputs_info[i]) {
 								                    data_shapes_string += item.first + get_shape_string(item.second.dataShape) + ",";
 								                }
 								                data_shapes_string =
 								                    data_shapes_string == "" ? "" : data_shapes_string.substr(0, data_shapes_string.size() - 1);
 								                groupLatencies.emplace_back(lats, data_shapes_string, FLAGS_latency_percentile);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            }
 								        }
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								        double totalDuration = inferRequestsQueue.get_duration_in_milliseconds();
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								        double fps = (FLAGS_api == "sync") ? batchSize * 1000.0 / generalLatency.median_or_percentile
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                                           : 1000.0 * processedFramesN / totalDuration;
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
 								        if (statistics) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                                       {StatisticsVariant("total execution time (ms)", "execution_time", totalDuration),
 								                                        StatisticsVariant("total number of iterations", "iterations_num", iteration)});
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								            if (device_name.find("MULTI") == std::string::npos) {
-												Introduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								                std::string latency_label;
 								                if (FLAGS_latency_percentile == 50) {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    latency_label = "Median latency (ms)";
-												Introduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								                } else {
 								                    latency_label = "latency (" + std::to_string(FLAGS_latency_percentile) + " percentile) (ms)";
 								                }
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                statistics->add_parameters(
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    StatisticsReport::Category::EXECUTION_RESULTS,
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                    {StatisticsVariant(latency_label, "latency_median", generalLatency.median_or_percentile),
 								                     StatisticsVariant("Percentile boundary", "percentile_boundary", FLAGS_latency_percentile),
 								                     StatisticsVariant("Average latency (ms)", "latency_avg", generalLatency.avg),
 								                     StatisticsVariant("Min latency (ms)", "latency_min", generalLatency.min),
-												Fix for missing throughput in case of Multi device (#10407)

* Fix for missing throughput in case of Multi device

* stylefix
											
										
										
											2022-02-17 16:32:19 +03:00
+								                     StatisticsVariant("Max latency (ms)", "latency_max", generalLatency.max)});
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								                if (FLAGS_pcseq && app_inputs_info.size() > 1) {
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                    for (size_t i = 0; i < groupLatencies.size(); ++i) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        statistics->add_parameters(
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                            StatisticsReport::Category::EXECUTION_RESULTS_GROUPPED,
 								                            {StatisticsVariant("Group Latencies", "group_latencies", groupLatencies[i])});
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blobs creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    }
 								                }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								            }
-												Fix for missing throughput in case of Multi device (#10407)

* Fix for missing throughput in case of Multi device

* stylefix
											
										
										
											2022-02-17 16:32:19 +03:00
+								            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
 								                                       {StatisticsVariant("throughput", "throughput", fps)});
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        }
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        progressBar.finish();
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								        // ----------------- 11. Dumping statistics report
 								        // -------------------------------------------------------------
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								        next_step();
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        if (!FLAGS_dump_config.empty()) {
 								            dump_config(FLAGS_dump_config, config);
-												DOCS: ported changes from 2022.1 release branch (#11206)

* Extensibility guide with FE extensions and remove OV_FRAMEWORK_MAP from docs

* Rework of Extensibility Intro, adopted examples to missing OPENVINO_FRAMEWORK_MAP

* Removed OPENVINO_FRAMEWORK_MAP reference

* Frontend extension detailed documentation

* Fixed distributed snippets

* Fixed snippet inclusion in FE extension document and chapter headers

* Fixed wrong name in a snippet reference

* Fixed test for template extension due to changed number of loaded extensions

* Update docs/Extensibility_UG/frontend_extensions.md

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* Minor fixes in extension snippets

* Small grammar fix

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>

* DOCS: transition banner (#10973)

* transition banner

* minor fix

* update transition banner

* updates

* update custom.js

* updates

* updates

* Documentation fixes (#11044)

* Benchmark app usage

* Fixed link to the devices

* More fixes

* Update docs/OV_Runtime_UG/multi_device.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Removed several hardcoded links

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Updated documentation for compile_tool (#11049)

* Added deployment guide (#11060)

* Added deployment guide

* Added local distribution

* Updates

* Fixed more indentations

* Removed obsolete code snippets (#11061)

* Removed obsolete code snippets

* NCC style

* Fixed NCC for BA

* Add a troubleshooting issue for PRC installation (#11074)

* updates

* adding gna to linux

* add missing reference

* update

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* Update docs/install_guides/installing-model-dev-tools.md

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* update

* minor updates

* add gna item to yum and apt

* add gna to get started page

* update reference formatting

* merge commit

* add a troubleshooting issue

* update

* update

* fix CVS-71846

Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>

* DOCS: fixed hardcoded links  (#11100)

* Fixes

* Use links

* applying reviewers comments to the Opt Guide (#11093)

* applying reviewers' comments

* fixed refs, more structuring (bold, bullets, etc)

* refactoring tput/latency sections

* next iteration (mostly latency), also brushed the auto-batching and other sections

* updates sync/async images

* common opts brushed

* WIP tput redesigned

* minor brushing of common and auto-batching

* Tput fully refactored

* fixed doc name in the link

* moved int8 perf counters to the right section

* fixed links

* fixed broken quotes

* fixed more links

* add ref to the internals to the TOC

* Added a note on the batch size

Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>

* [80085] New images for docs (#11114)

* change doc structure

* fix manager tools

* fix manager tools 3 step

* fix manager tools 3 step

* new img

* new img for OV Runtime

* fix steps

* steps

* fix indents

* change list

* fix space

* fix space

* code snippets fix

* change display

* Benchmarks 2022 1 (#11130)

* Minor fixes

* Updates for 2022.1

* Edits according to the review

* Edits according to review comments

* Edits according to review comments

* Edits according to review comments

* Fixed table

* Edits according to review comments

* Removed config for Intel® Core™ i7-11850HE

* Removed forward-tacotron-duration-prediction-241 graph

* Added resnet-18-pytorch

* Add info about Docker images in Deployment guide (#11136)

* Renamed user guides (#11137)

* fix screenshot (#11140)

* More conservative recommendations on dynamic shapes usage in docs (#11161)

* More conservative recommendations about using dynamic shapes

* Duplicated statement from C++ part to Python part of reshape doc (no semantical changes)

* Update ShapeInference.md (#11168)

* Benchmarks 2022 1 updates (#11180)

* Updated graphs

* Quick fix for TODO in Dynamic Shapes article

* Anchor link fixes

* Fixed DM config (#11199)

* DOCS: doxy sphinxtabs (#11027)

* initial implementation of doxy sphinxtabs

* fixes

* fixes

* fixes

* fixes

* fixes

* WA for ignored visibility attribute

* Fixes

Co-authored-by: Sergey Lyalin <sergey.lyalin@intel.com>
Co-authored-by: Ivan Tikhonov <ivan.tikhonov@intel.com>
Co-authored-by: Nikolay Tyukaev <nikolay.tyukaev@intel.com>
Co-authored-by: Sergey Lyubimtsev <sergey.lyubimtsev@intel.com>
Co-authored-by: Yuan Xu <yuan1.xu@intel.com>
Co-authored-by: Maxim Shevtsov <maxim.y.shevtsov@intel.com>
Co-authored-by: Andrey Zaytsev <andrey.zaytsev@intel.com>
Co-authored-by: Tatiana Savina <tatiana.savina@intel.com>
Co-authored-by: Ilya Naumov <ilya.naumov@intel.com>
Co-authored-by: Evgenya Stepyreva <evgenya.stepyreva@intel.com>
											
										
										
											2022-03-24 22:27:29 +03:00
+								            slog::info << "OpenVINO Runtime configuration settings were dumped to " << FLAGS_dump_config << slog::endl;
-												publish master branch snapshot, revision cdcab9d7ab48ffb0ee5629fabbfa06cb45debd9b

											
										
										
											2020-04-15 19:01:57 +03:00
+								        }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
+								        if (!FLAGS_exec_graph_path.empty()) {
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            try {
-												[core][python] ov::serialize (#10945)

* add ov::serialize

* create python binding

* update python tools

* use ov::serialize in benchmark app

* remove serialize from python offline_transformations

* fix import

* revert pot

* update docs

* apply review comments

* add const

* make bin path optional

* Add docs

* add compare test
											
										
										
											2022-03-23 11:44:00 +03:00
+								                ov::serialize(compiledModel.get_runtime_model(), FLAGS_exec_graph_path);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								                slog::info << "executable graph is stored to " << FLAGS_exec_graph_path << slog::endl;
-												refactor: add clang style check for samples (#5306)

* refactor: add clang style check for samples

* fix: add .clang-format for ie

* fix: style check for missing headers

* refactor: remove cpplint for IE samples

* fix: setw is not a member of std for classification_results.hpp

* feat: add indent after ifdefine

* feat: set up google style for IE samples

* fix indents for w_dirent headers

* fix: include issues for utils.cpp due to clang-format
											
										
										
											2021-04-22 14:02:54 +03:00
+								            } catch (const std::exception& ex) {
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								                slog::err << "Can't get executable graph: " << ex.what() << slog::endl;
 								            }
 								        }
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								        if (perf_counts) {
-												Removed ov::runtime namespace (#9781)

* Removed ov::runtime namespace

* clang-format

* Fixes

* template reference

* Fixes
											
										
										
											2022-01-20 16:17:57 +03:00
+								            std::vector<std::vector<ov::ProfilingInfo>> perfCounts;
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            for (size_t ireq = 0; ireq < nireq; ireq++) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                auto reqPerfCounts = inferRequestsQueue.requests[ireq]->get_performance_counts();
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								                if (FLAGS_pc) {
-												Typo for cross-check tool (#4350)


											
										
										
											2021-02-16 13:08:54 +09:00
+								                    slog::info << "Performance counts for " << ireq << "-th infer request:" << slog::endl;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                    printPerformanceCounts(reqPerfCounts, std::cout, getFullDeviceName(core, FLAGS_d), false);
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								                }
 								                perfCounts.push_back(reqPerfCounts);
 								            }
 								            if (statistics) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                statistics->dump_performance_counters(perfCounts);
-												Publishing 2019 R2 content (#223)



											
										
										
											2019-08-09 19:02:42 +03:00
+								            }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        }
-												Publishing 2019 R1 content

											
										
										
											2019-04-12 18:25:53 +03:00
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								        if (statistics)
 								            statistics->dump();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blob creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        // Performance metrics report
 								        slog::info << "Count:      " << iteration << " iterations" << slog::endl;
 								        slog::info << "Duration:   " << double_to_string(totalDuration) << " ms" << slog::endl;
-												Intoduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								        if (device_name.find("MULTI") == std::string::npos) {
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blob creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								            slog::info << "Latency: " << slog::endl;
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								            generalLatency.write_to_slog();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blob creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
 								            if (FLAGS_pcseq && app_inputs_info.size() > 1) {
 								                slog::info << "Latency for each data shape group:" << slog::endl;
 								                for (size_t i = 0; i < app_inputs_info.size(); ++i) {
 								                    slog::info << (i + 1) << ".";
 								                    for (auto& item : app_inputs_info[i]) {
 								                        std::stringstream input_shape;
 								                        auto shape = item.second.dataShape;
-												benchmark_app with dynamic reshapes and API 2.0 (#8609)

* API 2.0 changes

* stylefix

* Update samples/cpp/benchmark_app/main.cpp

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>

* Update samples/cpp/benchmark_app/infer_request_wrap.hpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* Update samples/cpp/benchmark_app/utils.cpp

Co-authored-by: Ilya Churaev <ilyachur@gmail.com>

* fixes

* fix for: gpu headers are moved to another folder... yet again

* fix for mac build paranoia

* function,classes and files renames/change logic to work with inputs()

* stylefix

* 2nd portion of fixes

* stylefix

* Batch warnings

Co-authored-by: Nadezhda Ageeva <nkogteva@gmail.com>
Co-authored-by: Ilya Churaev <ilyachur@gmail.com>
											
										
										
											2021-12-30 19:09:12 +03:00
+								                        std::copy(shape.begin(), shape.end() - 1, std::ostream_iterator<size_t>(input_shape, ","));
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blob creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                        input_shape << shape.back();
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								                        slog::info << " " << item.first << " : " << get_shape_string(item.second.dataShape);
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added cached blob creation

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                    }
 								                    slog::info << slog::endl;
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                    groupLatencies[i].write_to_slog();
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								                }
-												Intoduce -latency_percentile flag for the benchmark_app tool (#6479)

* Introduce new -latency_percentile flag for benchmark_app

* Fix syntax
											
										
										
											2021-07-23 10:29:55 +03:00
+								            }
 								        }
-												Dynamic reshapes (#7788)

* Merged and compiling

* Fix for dynamic shape type

* review fixes

* renamed blob shape to tensor shape, small improvements

* fix code style

* added parsing of multiple shapes

* store latency per group, add isIdleRequestAvailable() to Infer Queue

* added cached random inputs

* redesign pipeline, added new metrics(avg, max, min), added metrics per groups

* fixed code style

* small improvements

* modified tensor parameters parsing

* modified -i parameter parsing: added possibility to specify input names

* implemented image caching

* added creation of cached blobs

* added -pcseq flag, modified batch filling, changes fps formula

* improvements

* code formatting

* code formatting2

* apply suggestions from review

* replaced Buffer class with InferenceEngine Blobs

* use batch size in blobs filling

* added shared blob allocator to handle blob's data

* fixed warnings & code style

* allocate blobs

* fix for networks with image info input

* added comments & fixed codestyle

* clear data in free() in SharedBlobAllocator

* remove unnecessary check

* Delimiter is changed to ::

* stylefix

* added layout from string function, small improvements

* modified parsing to enable : in input parameters

* small fixes

* small fixes

* added missed blob allocation, fixes

* [TEST]added support for remote blobs

* fix remote blobs

* new inputs/files output format

* removed vectors resize which caused bugs

* made cl::Buffer type under ifdef, fix inputs filling

* changed batch() function to not throwing exceptions

* removed unused var

* fix code style

* replace empty name in input files with name from net input

* restored old behaviour for static models

* fix code style

* fix warning - made const iterator

* fix warning - remove reference in loop variable

* added random and image_info input types to -i, fix problem with layout

* replaced batch() with getBatchSize() in main

* fix layout, shape, tensor shape parameters parsing

* upd help messages for input, tensor shape and pcseq command

* added buffer for cl output blobs, small fixes

Signed-off-by: ivikhrev <ivan.vikhrev@intel.com>

* added legacy mode

* restore setBlob

* code style formatting

* move collecting latency for groups under flag

* removed not applicable layouts

* added hint to error message when wrong input name in -tensor_shape was specified

* added new metrics to statistics report

* Apply suggestions from code review

* fix binary blobs filling when layout is CN

* apply suggestions

* moved file in the right place after rebase

* improved -pcseq output

* updated args and readme

* removed TEMPLATE plugin registration

* fix -shape arg description

* enable providing several -i args as input

* renamed legacy_mode to inference_only and made it default for static models, renamed tensor_shape to data_shape

* upd readme

* use getBlob() in inference only mode

* fix old input type for static case

* fix typo

* upd readme

* move log about benchmark mode to the measuring performance step

* added class for latency metrics

* upd readme, fix typos, renamed funcs

* fix warning and upd parsing to avoid error with : in file paths

* fix error on centos : error: use of deleted function ‘std::basic_stringstream<char>::basic_stringstream(const std::basic_stringstream<char>&)

* added check for key in inputs

* renamed input to inputs

* adjust batch size for binary blobs

* replaced warning with exception in bench mode defining

* align measurement cycle with master

Co-authored-by: ivikhrev <ivan.vikhrev@intel.com>
											
										
										
											2021-12-17 12:20:43 +03:00
+								        slog::info << "Throughput: " << double_to_string(fps) << " FPS" << slog::endl;
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								    } catch (const std::exception& ex) {
 								        slog::err << ex.what() << slog::endl;
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
 								        if (statistics) {
-												[IE SAMPLES] activated NCC tool for c++ samples (#9600)

* [IE SAMPLES] activated NCC tool for c++ samples

* exclude ov_ncc_naming_style for tests

* fixed NCC hit

* Added support for source files in samples

* changed style of methods for benchmark

* changed style for speech sample

* changed code style

* changed code style for shared_tensor

* benchmark changes

* changed remote_tensors_filling

* fixed notes

* rebase of branch
											
										
										
											2022-01-19 01:08:07 +03:00
+								            statistics->add_parameters(StatisticsReport::Category::EXECUTION_RESULTS,
-												Benchmark_app: JSON writer for statistics (#9887)

* Refactored statistics output with JSON support

* Detailed/average reports are added

* stylefix

* Update samples/cpp/benchmark_app/statistics_report.hpp

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>

* Linux Fixes

* stylefixes

* data_shape field format is changed

* stylefix

Co-authored-by: Ivan Vikhrev <ivan.vikhrev@intel.com>
											
										
										
											2022-02-03 01:47:46 +03:00
+								                                       {StatisticsVariant("error", "error", ex.what())});
-												Publishing 2019 R3 content

											
										
										
											2019-10-04 19:26:43 +03:00
+								            statistics->dump();
 								        }
-												Publishing R4 (#41)

* Publishing R4

											
										
										
											2018-11-23 16:19:43 +03:00
+								        return 3;
 								    }
 								    return 0;
 								}