Adds support of user layouts to benchmark_app (#4002)

* Adds support of user layouts to benchmark_app

* Keep snake_case for python

Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
This commit is contained in:
Nadezhda Ageeva 2021-02-11 12:57:05 +03:00 committed by GitHub
parent 2a2ef7d989
commit 4e3d7d23fc
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
13 changed files with 419 additions and 252 deletions

View File

@ -92,6 +92,7 @@ Options:
-t Optional. Time, in seconds, to execute topology.
-progress Optional. Show progress bar (can affect performance measurement). Default value is "false".
-shape Optional. Set shape for input. For example, "input1[1,3,224,224],input2[1,4]" or "[1,3,224,224]" in case of one input size.
-layout Optional. Prompts how network layouts should be treated by application. For example, "input1[NCHW],input2[NC]" or "[NCHW]" in case of one input size.
CPU-specific performance options:
-nstreams "<integer>" Optional. Number of streams to use for inference on the CPU, GPU or MYRIAD devices

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -102,6 +102,9 @@ static const char dump_config_message[] = "Optional. Path to XML/YAML/JSON file
static const char shape_message[] = "Optional. Set shape for input. For example, \"input1[1,3,224,224],input2[1,4]\" or \"[1,3,224,224]\""
" in case of one input size.";
static const char layout_message[] = "Optional. Prompts how network layouts should be treated by application. "
"For example, \"input1[NCHW],input2[NC]\" or \"[NCHW]\" in case of one input size.";
// @brief message for quantization bits
static const char gna_qb_message[] = "Optional. Weight bits for quantization: 8 or 16 (default)";
@ -189,6 +192,9 @@ DEFINE_string(dump_config, "", dump_config_message);
/// @brief Define flag for input shape <br>
DEFINE_string(shape, "", shape_message);
/// @brief Define flag for layout shape <br>
DEFINE_string(layout, "", layout_message);
/// @brief Define flag for quantization bits (default 16)
DEFINE_int32(qb, 16, gna_qb_message);
@ -215,6 +221,7 @@ static void showUsage() {
std::cout << " -t " << execution_time_message << std::endl;
std::cout << " -progress " << progress_message << std::endl;
std::cout << " -shape " << shape_message << std::endl;
std::cout << " -layout " << layout_message << std::endl;
std::cout << std::endl << " device-specific performance options:" << std::endl;
std::cout << " -nstreams \"<integer>\" " << infer_num_streams_message << std::endl;
std::cout << " -nthreads \"<integer>\" " << infer_num_threads_message << std::endl;

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -48,7 +48,7 @@ std::vector<std::string> filterFilesByExtensions(const std::vector<std::string>&
void fillBlobImage(Blob::Ptr& inputBlob,
const std::vector<std::string>& filePaths,
const size_t& batchSize,
const InputInfo& info,
const benchmark_app::InputInfo& app_info,
const size_t& requestId,
const size_t& inputId,
const size_t& inputSize) {
@ -60,7 +60,6 @@ void fillBlobImage(Blob::Ptr& inputBlob,
// locked memory holder should be alive all time while access to its buffer happens
auto minputHolder = minput->wmap();
auto inputBlobData = minputHolder.as<uint8_t *>();
const TensorDesc& inputBlobDesc = inputBlob->getTensorDesc();
/** Collect images data ptrs **/
std::vector<std::shared_ptr<uint8_t>> vreader;
@ -77,24 +76,30 @@ void fillBlobImage(Blob::Ptr& inputBlob,
}
/** Getting image data **/
TensorDesc desc = info.getTensorDesc();
std::shared_ptr<uint8_t> imageData(reader->getData(getTensorWidth(desc), getTensorHeight(desc)));
std::shared_ptr<uint8_t> imageData(reader->getData(app_info.width(), app_info.height()));
if (imageData) {
vreader.push_back(imageData);
}
}
/** Fill input tensor with images. First b channel, then g and r channels **/
const size_t numChannels = getTensorChannels(inputBlobDesc);
const size_t imageSize = getTensorWidth(inputBlobDesc) * getTensorHeight(inputBlobDesc);
const size_t numChannels = app_info.channels();
const size_t width = app_info.width();
const size_t height = app_info.height();
/** Iterate over all input images **/
for (size_t imageId = 0; imageId < vreader.size(); ++imageId) {
/** Iterate over all pixel in image (b,g,r) **/
for (size_t pid = 0; pid < imageSize; pid++) {
/** Iterate over all width **/
for (size_t w = 0; w < app_info.width(); ++w) {
/** Iterate over all height **/
for (size_t h = 0; h < app_info.height(); ++h) {
/** Iterate over all channels **/
for (size_t ch = 0; ch < numChannels; ++ch) {
/** [images stride + channels stride + pixel id ] all in bytes **/
inputBlobData[imageId * imageSize * numChannels + ch * imageSize + pid] = vreader.at(imageId).get()[pid*numChannels + ch];
size_t offset = imageId * numChannels * width * height +
(((app_info.layout == "NCHW") || (app_info.layout == "CHW")) ?
(ch * width * height + h * width + w) : (h * width * numChannels + w * numChannels + ch));
inputBlobData[offset] = vreader.at(imageId).get()[h * width * numChannels + w * numChannels + ch];
}
}
}
}
@ -185,24 +190,23 @@ void fillBlobImInfo(Blob::Ptr& inputBlob,
void fillBlobs(const std::vector<std::string>& inputFiles,
const size_t& batchSize,
const InferenceEngine::ConstInputsDataMap& info,
benchmark_app::InputsInfo& app_inputs_info,
std::vector<InferReqWrap::Ptr> requests) {
std::vector<std::pair<size_t, size_t>> input_image_sizes;
for (const ConstInputsDataMap::value_type& item : info) {
if (isImage(item.second)) {
input_image_sizes.push_back(std::make_pair(getTensorWidth(item.second->getTensorDesc()),
getTensorHeight(item.second->getTensorDesc())));
for (auto& item : app_inputs_info) {
if (item.second.isImage()) {
input_image_sizes.push_back(std::make_pair(item.second.width(), item.second.height()));
}
slog::info << "Network input '" << item.first << "' precision " << item.second->getTensorDesc().getPrecision()
<< ", dimensions (" << item.second->getTensorDesc().getLayout() << "): ";
for (const auto& i : item.second->getTensorDesc().getDims()) {
slog::info << "Network input '" << item.first << "' precision " << item.second.precision
<< ", dimensions (" << item.second.layout << "): ";
for (const auto& i : item.second.shape) {
slog::info << i << " ";
}
slog::info << slog::endl;
}
size_t imageInputCount = input_image_sizes.size();
size_t binaryInputCount = info.size() - imageInputCount;
size_t binaryInputCount = app_inputs_info.size() - imageInputCount;
std::vector<std::string> binaryFiles;
std::vector<std::string> imageFiles;
@ -258,26 +262,28 @@ void fillBlobs(const std::vector<std::string>& inputFiles,
size_t imageInputId = 0;
size_t binaryInputId = 0;
for (const ConstInputsDataMap::value_type& item : info) {
for (auto& item : app_inputs_info) {
Blob::Ptr inputBlob = requests.at(requestId)->getBlob(item.first);
if (isImage(inputBlob)) {
auto app_info = app_inputs_info.at(item.first);
auto precision = app_info.precision;
if (app_info.isImage()) {
if (!imageFiles.empty()) {
// Fill with Images
fillBlobImage(inputBlob, imageFiles, batchSize, *item.second, requestId, imageInputId++, imageInputCount);
fillBlobImage(inputBlob, imageFiles, batchSize, app_info, requestId, imageInputId++, imageInputCount);
continue;
}
} else {
if (!binaryFiles.empty()) {
// Fill with binary files
if (item.second->getPrecision() == InferenceEngine::Precision::FP32) {
if (precision == InferenceEngine::Precision::FP32) {
fillBlobBinary<float>(inputBlob, binaryFiles, batchSize, requestId, binaryInputId++, binaryInputCount);
} else if (item.second->getPrecision() == InferenceEngine::Precision::FP16) {
} else if (precision == InferenceEngine::Precision::FP16) {
fillBlobBinary<short>(inputBlob, binaryFiles, batchSize, requestId, binaryInputId++, binaryInputCount);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I32) {
} else if (precision == InferenceEngine::Precision::I32) {
fillBlobBinary<int32_t>(inputBlob, binaryFiles, batchSize, requestId, binaryInputId++, binaryInputCount);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I64) {
} else if (precision == InferenceEngine::Precision::I64) {
fillBlobBinary<int64_t>(inputBlob, binaryFiles, batchSize, requestId, binaryInputId++, binaryInputCount);
} else if (item.second->getPrecision() == InferenceEngine::Precision::U8) {
} else if (precision == InferenceEngine::Precision::U8) {
fillBlobBinary<uint8_t>(inputBlob, binaryFiles, batchSize, requestId, binaryInputId++, binaryInputCount);
} else {
THROW_IE_EXCEPTION << "Input precision is not supported for " << item.first;
@ -285,18 +291,18 @@ void fillBlobs(const std::vector<std::string>& inputFiles,
continue;
}
if (isImageInfo(inputBlob) && (input_image_sizes.size() == 1)) {
if (app_info.isImageInfo() && (input_image_sizes.size() == 1)) {
// Most likely it is image info: fill with image information
auto image_size = input_image_sizes.at(0);
slog::info << "Fill input '" << item.first << "' with image size " << image_size.first << "x"
<< image_size.second << slog::endl;
if (item.second->getPrecision() == InferenceEngine::Precision::FP32) {
if (precision == InferenceEngine::Precision::FP32) {
fillBlobImInfo<float>(inputBlob, batchSize, image_size);
} else if (item.second->getPrecision() == InferenceEngine::Precision::FP16) {
} else if (precision == InferenceEngine::Precision::FP16) {
fillBlobImInfo<short>(inputBlob, batchSize, image_size);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I32) {
} else if (precision == InferenceEngine::Precision::I32) {
fillBlobImInfo<int32_t>(inputBlob, batchSize, image_size);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I64) {
} else if (precision == InferenceEngine::Precision::I64) {
fillBlobImInfo<int64_t>(inputBlob, batchSize, image_size);
} else {
THROW_IE_EXCEPTION << "Input precision is not supported for image info!";
@ -306,23 +312,23 @@ void fillBlobs(const std::vector<std::string>& inputFiles,
}
// Fill random
slog::info << "Fill input '" << item.first << "' with random values ("
<< std::string((isImage(inputBlob) ? "image" : "some binary data"))
<< std::string((app_info.isImage() ? "image" : "some binary data"))
<< " is expected)" << slog::endl;
if (item.second->getPrecision() == InferenceEngine::Precision::FP32) {
if (precision == InferenceEngine::Precision::FP32) {
fillBlobRandom<float>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::FP16) {
} else if (precision == InferenceEngine::Precision::FP16) {
fillBlobRandom<short>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I32) {
} else if (precision == InferenceEngine::Precision::I32) {
fillBlobRandom<int32_t>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I64) {
} else if (precision == InferenceEngine::Precision::I64) {
fillBlobRandom<int64_t>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::U8) {
} else if (precision == InferenceEngine::Precision::U8) {
fillBlobRandom<uint8_t>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I8) {
} else if (precision == InferenceEngine::Precision::I8) {
fillBlobRandom<int8_t>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::U16) {
} else if (precision == InferenceEngine::Precision::U16) {
fillBlobRandom<uint16_t>(inputBlob);
} else if (item.second->getPrecision() == InferenceEngine::Precision::I16) {
} else if (precision == InferenceEngine::Precision::I16) {
fillBlobRandom<int16_t>(inputBlob);
} else {
THROW_IE_EXCEPTION << "Input precision is not supported for " << item.first;

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -9,29 +9,10 @@
#include <inference_engine.hpp>
#include "utils.hpp"
#include "infer_request_wrap.hpp"
template<typename T>
static bool isImage(const T &blob) {
    // An input qualifies as an image only when it is a 4D NCHW blob
    // carrying exactly three channels (dimension index 1).
    const auto desc = blob->getTensorDesc();
    if (desc.getLayout() != InferenceEngine::NCHW) {
        return false;
    }
    return desc.getDims()[1] == 3;
}
template<typename T>
static bool isImageInfo(const T &blob) {
    // Image-info inputs are 2D NC blobs with at least two values
    // (typically {height, width} or {height, width, scale}).
    const auto desc = blob->getTensorDesc();
    if (desc.getLayout() != InferenceEngine::NC) {
        return false;
    }
    return desc.getDims()[1] >= 2;
}
void fillBlobs(const std::vector<std::string>& inputFiles,
const size_t& batchSize,
const InferenceEngine::ConstInputsDataMap& info,
benchmark_app::InputsInfo& app_inputs_info,
std::vector<InferReqWrap::Ptr> requests);

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -320,6 +320,8 @@ int main(int argc, char *argv[]) {
size_t batchSize = FLAGS_b;
Precision precision = Precision::UNSPECIFIED;
std::string topology_name = "";
benchmark_app::InputsInfo app_inputs_info;
std::string output_name;
if (!isNetworkCompiled) {
// ----------------- 4. Reading the Intermediate Representation network ----------------------------------------
next_step();
@ -345,15 +347,12 @@ int main(int argc, char *argv[]) {
next_step();
batchSize = cnnNetwork.getBatchSize();
// Parse input shapes if specified
InferenceEngine::ICNNNetwork::InputShapes shapes = cnnNetwork.getInputShapes();
bool reshape = false;
if (!FLAGS_shape.empty()) {
reshape |= updateShapes(shapes, FLAGS_shape, inputInfo);
}
if ((FLAGS_b != 0) && (batchSize != FLAGS_b)) {
reshape |= adjustShapesBatch(shapes, FLAGS_b, inputInfo);
}
app_inputs_info = getInputsInfo<InputInfo::Ptr>(FLAGS_shape, FLAGS_layout, FLAGS_b, inputInfo, reshape);
if (reshape) {
InferenceEngine::ICNNNetwork::InputShapes shapes = {};
for (auto& item : app_inputs_info)
shapes[item.first] = item.second.shape;
slog::info << "Reshaping network: " << getShapesString(shapes) << slog::endl;
startTime = Time::now();
cnnNetwork.reshape(shapes);
@ -365,7 +364,9 @@ int main(int argc, char *argv[]) {
{"reshape network time (ms)", duration_ms}
});
}
batchSize = cnnNetwork.getBatchSize();
// use batch size according to provided layout and shapes
batchSize = (!FLAGS_layout.empty()) ? getBatchSize(app_inputs_info) : cnnNetwork.getBatchSize();
topology_name = cnnNetwork.getName();
slog::info << (FLAGS_b != 0 ? "Network batch size was changed to: " : "Network batch size: ") << batchSize << slog::endl;
@ -373,9 +374,10 @@ int main(int argc, char *argv[]) {
next_step();
for (auto& item : inputInfo) {
if (isImage(item.second)) {
if (app_inputs_info.at(item.first).isImage()) {
/** Set the precision of input data provided by the user, should be called before load of the network to the device **/
item.second->setPrecision(Precision::U8);
app_inputs_info.at(item.first).precision = Precision::U8;
item.second->setPrecision(app_inputs_info.at(item.first).precision);
}
}
// ----------------- 7. Loading the model to the device --------------------------------------------------------
@ -407,6 +409,7 @@ int main(int argc, char *argv[]) {
{
{"import network time (ms)", duration_ms}
});
app_inputs_info = getInputsInfo<InputInfo::CPtr>(FLAGS_shape, FLAGS_layout, FLAGS_b, exeNetwork.GetInputsInfo());
if (batchSize == 0) {
batchSize = 1;
}
@ -485,8 +488,7 @@ int main(int argc, char *argv[]) {
next_step();
InferRequestsQueue inferRequestsQueue(exeNetwork, nireq);
const InferenceEngine::ConstInputsDataMap info(exeNetwork.GetInputsInfo());
fillBlobs(inputFiles, batchSize, info, inferRequestsQueue.requests);
fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
// ----------------- 10. Measuring performance ------------------------------------------------------------------
size_t progressCnt = 0;

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -8,6 +8,7 @@
#include <vector>
#include <map>
#include <regex>
#include <iostream>
#include <samples/common.hpp>
#include <samples/slog.hpp>
@ -18,6 +19,41 @@
#include <opencv2/core.hpp>
#endif
namespace benchmark_app {
// True when this input looks like an image tensor: one of the spatial
// layouts the app understands, with exactly 3 channels.
bool InputInfo::isImage() const {
    if ((layout != "NCHW") && (layout != "NHWC") &&
        (layout != "CHW") && (layout != "HWC"))
        return false;
    return (channels() == 3);
}
// True when this input looks like an image-info blob: "NC" layout with
// at least two values (e.g. {height, width} or {height, width, scale}).
bool InputInfo::isImageInfo() const {
    if (layout != "NC")
        return false;
    return (channels() >= 2);
}
// Returns the extent of the dimension identified by the given layout
// character ('N', 'C', 'H', 'W', 'D'). Throws if the layout lacks that axis.
size_t InputInfo::getDimentionByLayout(char character) const {
    size_t pos = layout.find(character);
    if (pos == std::string::npos)
        // std::string(1, character) builds a one-character string; the
        // original (character, 1) argument order produced a string of
        // `character` copies of the '\x01' byte instead of the axis letter.
        throw std::runtime_error("Error: Can't get " + std::string(1, character) + " from layout " + layout);
    return shape.at(pos);
}
size_t InputInfo::width() const {
    return getDimentionByLayout('W');
}
size_t InputInfo::height() const {
    return getDimentionByLayout('H');
}
size_t InputInfo::channels() const {
    return getDimentionByLayout('C');
}
size_t InputInfo::batch() const {
    return getDimentionByLayout('N');
}
size_t InputInfo::depth() const {
    return getDimentionByLayout('D');
}
} // namespace benchmark_app
uint32_t deviceDefaultDeviceDurationInSeconds(const std::string& device) {
static const std::map<std::string, uint32_t> deviceDefaultDurationInSeconds {
{ "CPU", 60 },
@ -102,61 +138,20 @@ std::map<std::string, std::string> parseNStreamsValuePerDevice(const std::vector
return result;
}
bool adjustShapesBatch(InferenceEngine::ICNNNetwork::InputShapes& shapes,
const size_t batch_size, const InferenceEngine::InputsDataMap& input_info) {
bool updated = false;
for (auto& item : input_info) {
auto layout = item.second->getTensorDesc().getLayout();
int batch_index = -1;
if ((layout == InferenceEngine::Layout::NCHW) || (layout == InferenceEngine::Layout::NCDHW) ||
(layout == InferenceEngine::Layout::NHWC) || (layout == InferenceEngine::Layout::NDHWC) ||
(layout == InferenceEngine::Layout::NC)) {
batch_index = 0;
} else if (layout == InferenceEngine::Layout::CN) {
batch_index = 1;
}
if ((batch_index != -1) && (shapes.at(item.first).at(batch_index) != batch_size)) {
shapes[item.first][batch_index] = batch_size;
updated = true;
size_t getBatchSize(const benchmark_app::InputsInfo& inputs_info) {
size_t batch_size = 0;
for (auto& info : inputs_info) {
std::size_t batch_index = info.second.layout.find("N");
if (batch_index != std::string::npos) {
if (batch_size == 0)
batch_size = info.second.shape[batch_index];
else if (batch_size != info.second.shape[batch_index])
throw std::logic_error("Can't deterimine batch size: batch is different for different inputs!");
}
}
return updated;
}
bool updateShapes(InferenceEngine::ICNNNetwork::InputShapes& shapes,
const std::string shapes_string, const InferenceEngine::InputsDataMap& input_info) {
bool updated = false;
std::string search_string = shapes_string;
auto start_pos = search_string.find_first_of('[');
while (start_pos != std::string::npos) {
auto end_pos = search_string.find_first_of(']');
if (end_pos == std::string::npos)
break;
auto input_name = search_string.substr(0, start_pos);
auto input_shape = search_string.substr(start_pos + 1, end_pos - start_pos - 1);
std::vector<size_t> parsed_shape;
for (auto& dim : split(input_shape, ',')) {
parsed_shape.push_back(std::stoi(dim));
}
if (!input_name.empty()) {
shapes[input_name] = parsed_shape;
updated = true;
} else {
for (auto& item : input_info) {
shapes[item.first] = parsed_shape;
}
updated = true;
}
search_string = search_string.substr(end_pos + 1);
if (search_string.empty() || search_string.front() != ',')
break;
search_string = search_string.substr(1);
start_pos = search_string.find_first_of('[');
}
if (!search_string.empty())
throw std::logic_error("Can't parse `shape` parameter: " + shapes_string);
return updated;
if (batch_size == 0)
batch_size = 1;
return batch_size;
}
std::string getShapesString(const InferenceEngine::ICNNNetwork::InputShapes& shapes) {

View File

@ -1,4 +1,4 @@
// Copyright (C) 2018-2020 Intel Corporation
// Copyright (C) 2018-2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
@ -8,15 +8,119 @@
#include <vector>
#include <map>
namespace benchmark_app {
// Describes one network input as seen by benchmark_app after the user's
// -shape / -layout / -b command-line overrides have been applied.
struct InputInfo {
InferenceEngine::Precision precision;  // element precision of the blob
InferenceEngine::SizeVector shape;     // full tensor dimensions (possibly reshaped)
std::string layout;                    // layout string, e.g. "NCHW" or "NC"
// True for 3-channel inputs in a spatial layout (see the .cpp definition).
bool isImage() const;
// True for "NC" inputs with >= 2 values (image-info blobs).
bool isImageInfo() const;
// Extent of the axis named by the layout character; throws if absent.
// NOTE(review): "Dimention" is a misspelling kept for API compatibility.
size_t getDimentionByLayout(char character) const;
size_t width() const;
size_t height() const;
size_t channels() const;
size_t batch() const;
size_t depth() const;
};
// Maps input name -> resolved input description.
using InputsInfo = std::map<std::string, InputInfo>;
}  // namespace benchmark_app
std::vector<std::string> parseDevices(const std::string& device_string);
uint32_t deviceDefaultDeviceDurationInSeconds(const std::string& device);
std::map<std::string, std::string> parseNStreamsValuePerDevice(const std::vector<std::string>& devices,
const std::string& values_string);
bool updateShapes(InferenceEngine::ICNNNetwork::InputShapes& shapes,
const std::string shapes_string, const InferenceEngine::InputsDataMap& input_info);
bool adjustShapesBatch(InferenceEngine::ICNNNetwork::InputShapes& shapes,
const size_t batch_size, const InferenceEngine::InputsDataMap& input_info);
std::string getShapesString(const InferenceEngine::ICNNNetwork::InputShapes& shapes);
size_t getBatchSize(const benchmark_app::InputsInfo& inputs_info);
std::vector<std::string> split(const std::string &s, char delim);
template <typename T>
std::map<std::string, std::string> parseInputParameters(const std::string parameter_string,
                                                        const std::map<std::string, T>& input_info) {
    // Parses strings of the form "input0[value0],input1[value1]" or "[value]";
    // a bracketed value without an input name is applied to every input.
    std::map<std::string, std::string> result;
    std::string remainder = parameter_string;
    for (auto open_pos = remainder.find_first_of('['); open_pos != std::string::npos;
         open_pos = remainder.find_first_of('[')) {
        const auto close_pos = remainder.find_first_of(']');
        if (close_pos == std::string::npos)
            break;
        const auto input_name = remainder.substr(0, open_pos);
        const auto input_value = remainder.substr(open_pos + 1, close_pos - open_pos - 1);
        if (input_name.empty()) {
            // Unnamed value: broadcast it to all known inputs.
            for (auto& item : input_info) {
                result[item.first] = input_value;
            }
        } else {
            result[input_name] = input_value;
        }
        remainder = remainder.substr(close_pos + 1);
        if (remainder.empty() || remainder.front() != ',')
            break;
        remainder = remainder.substr(1);
    }
    // Anything left over means the string was malformed.
    if (!remainder.empty())
        throw std::logic_error("Can't parse input parameter string: " + parameter_string);
    return result;
}
template <typename T>
benchmark_app::InputsInfo getInputsInfo(const std::string& shape_string,
                                        const std::string& layout_string,
                                        const size_t batch_size,
                                        const std::map<std::string, T>& input_info,
                                        bool& reshape_required) {
    // Resolve the per-input overrides from the -shape and -layout strings once.
    auto shape_map = parseInputParameters(shape_string, input_info);
    auto layout_map = parseInputParameters(layout_string, input_info);
    reshape_required = false;
    benchmark_app::InputsInfo info_map;
    for (auto& item : input_info) {
        const auto& name = item.first;
        const auto descriptor = item.second->getTensorDesc();
        benchmark_app::InputInfo info;
        // Precision always comes from the network.
        info.precision = descriptor.getPrecision();
        // Shape: a user-supplied "d0,d1,..." override wins over the network dims.
        const auto shape_override = shape_map.find(name);
        if (shape_override != shape_map.end()) {
            for (auto& dim : split(shape_override->second, ',')) {
                info.shape.push_back(std::stoi(dim));
            }
            reshape_required = true;
        } else {
            info.shape = descriptor.getDims();
        }
        // Layout: the user override is upper-cased; otherwise the network's
        // layout enum is stringified.
        const auto layout_override = layout_map.find(name);
        if (layout_override != layout_map.end()) {
            info.layout = layout_override->second;
            std::transform(info.layout.begin(), info.layout.end(), info.layout.begin(), ::toupper);
        } else {
            std::stringstream ss;
            ss << descriptor.getLayout();
            info.layout = ss.str();
        }
        // -b overrides the batch dimension when the layout exposes an 'N' axis.
        if (batch_size != 0) {
            const std::size_t batch_index = info.layout.find("N");
            if ((batch_index != std::string::npos) && (info.shape.at(batch_index) != batch_size)) {
                info.shape[batch_index] = batch_size;
                reshape_required = true;
            }
        }
        info_map[name] = info;
    }
    return info_map;
}
template <typename T>
benchmark_app::InputsInfo getInputsInfo(const std::string& shape_string,
                                        const std::string& layout_string,
                                        const size_t batch_size,
                                        const std::map<std::string, T>& input_info) {
    // Convenience overload for callers that do not need to know whether the
    // overrides require a network reshape; the flag is computed and discarded.
    bool ignored_reshape_flag = false;
    return getInputsInfo<T>(shape_string, layout_string, batch_size, input_info, ignored_reshape_flag);
}
#ifdef USE_OPENCV
void dump_config(const std::string& filename,

View File

@ -109,6 +109,13 @@ Options:
-t TIME, --time TIME Optional. Time in seconds to execute topology.
-progress [PROGRESS] Optional. Show progress bar (can affect performance
measurement). Default value is "False".
-shape SHAPE Optional. Set shape for input. For example,
"input1[1,3,224,224],input2[1,4]" or "[1,3,224,224]"
in case of one input size.
-layout LAYOUT Optional. Prompts how network layouts should be
treated by application. For example,
"input1[NCHW],input2[NC]" or "[NCHW]" in case of one
input size.
-nstreams NUMBER_STREAMS, --number_streams NUMBER_STREAMS
Optional. Number of streams to use for inference on the CPU/GPU in throughput mode
(for HETERO and MULTI device cases use format <device1>:<nstreams1>,<device2>:<nstreams2> or just <nstreams>).

View File

@ -103,8 +103,12 @@ Options:
-progress [PROGRESS] Optional. Show progress bar (can affect performance
measurement). Default value is "False".
-shape SHAPE Optional. Set shape for input. For example,
"input1[1,3,224,224],input2[1,4]" or "[1,3,224,224]" in
case of one input size.
"input1[1,3,224,224],input2[1,4]" or "[1,3,224,224]"
in case of one input size.
-layout LAYOUT Optional. Prompts how network layouts should be
treated by application. For example,
"input1[NCHW],input2[NC]" or "[NCHW]" in case of one
input size.
-nstreams NUMBER_STREAMS, --number_streams NUMBER_STREAMS
Optional. Number of streams to use for inference on the CPU/GPU/MYRIAD
(for HETERO and MULTI device cases use format <device1>:<nstreams1>,<device2>:<nstreams2> or just <nstreams>).

View File

@ -11,8 +11,8 @@ from openvino.tools.benchmark.utils.logging import logger
from openvino.tools.benchmark.utils.progress_bar import ProgressBar
from openvino.tools.benchmark.utils.utils import next_step, config_network_inputs, get_number_iterations, \
process_help_inference_string, print_perf_counters, dump_exec_graph, get_duration_in_milliseconds, \
get_command_line_arguments, parse_nstreams_value_per_device, parse_devices, update_shapes, \
adjust_shapes_batch, load_config, dump_config
get_command_line_arguments, parse_nstreams_value_per_device, parse_devices, get_inputs_info, \
get_batch_size, load_config, dump_config
from openvino.tools.benchmark.utils.statistics_report import StatisticsReport, averageCntReport, detailedCntReport
@ -193,15 +193,10 @@ def run(args):
# --------------------- 5. Resizing network to match image sizes and given batch ---------------------------
next_step()
shapes = {k: v.input_data.shape.copy() for k, v in ie_network.input_info.items()}
reshape = False
if args.shape:
reshape |= update_shapes(shapes, args.shape, ie_network.input_info)
if args.batch_size and args.batch_size != ie_network.batch_size:
reshape |= adjust_shapes_batch(shapes, args.batch_size, ie_network.input_info)
app_inputs_info, reshape = get_inputs_info(args.shape, args.layout, args.batch_size, ie_network.input_info)
if reshape:
start_time = datetime.utcnow()
shapes = { k : v.shape for k,v in app_inputs_info.items() }
logger.info(
'Reshaping network: {}'.format(', '.join("'{}': {}".format(k, v) for k, v in shapes.items())))
ie_network.reshape(shapes)
@ -213,13 +208,15 @@ def run(args):
('reshape network time (ms)', duration_ms)
])
batch_size = ie_network.batch_size
logger.info('Network batch size: {}'.format(ie_network.batch_size))
# use batch size according to provided layout and shapes
batch_size = get_batch_size(app_inputs_info) if args.layout else ie_network.batch_size
logger.info('Network batch size: {}'.format(batch_size))
# --------------------- 6. Configuring input of the model --------------------------------------------------
next_step()
config_network_inputs(ie_network)
config_network_inputs(ie_network, app_inputs_info)
# --------------------- 7. Loading the model to the device -------------------------------------------------
next_step()
@ -253,6 +250,7 @@ def run(args):
[
('import network time (ms)', duration_ms)
])
app_inputs_info, _ = get_inputs_info(args.shape, args.layout, args.batch_size, exe_network.input_info)
if batch_size == 0:
batch_size = 1
@ -277,7 +275,7 @@ def run(args):
if args.paths_to_input:
for path in args.paths_to_input:
paths_to_input.append(os.path.abspath(*path) if args.paths_to_input else None)
set_inputs(paths_to_input, batch_size, exe_network.input_info, infer_requests)
set_inputs(paths_to_input, batch_size, app_inputs_info, infer_requests)
if statistics:
statistics.add_parameters(StatisticsReport.Category.RUNTIME_CONFIG,

View File

@ -68,6 +68,10 @@ def parse_args():
args.add_argument('-shape', type=str, required=False, default='',
help='Optional. '
'Set shape for input. For example, "input1[1,3,224,224],input2[1,4]" or "[1,3,224,224]" in case of one input size.')
args.add_argument('-layout', type=str, required=False, default='',
help='Optional. '
'Prompts how network layouts should be treated by application. '
'For example, "input1[NCHW],input2[NC]" or "[NCHW]" in case of one input size.')
args.add_argument('-nstreams', '--number_streams', type=str, required=False, default=None,
help='Optional. Number of streams to use for inference on the CPU/GPU/MYRIAD '
'(for HETERO and MULTI device cases use format <device1>:<nstreams1>,<device2>:<nstreams2> '

View File

@ -1,5 +1,5 @@
"""
Copyright (C) 2018-2020 Intel Corporation
Copyright (C) 2018-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
@ -22,21 +22,8 @@ from glob import glob
from .constants import IMAGE_EXTENSIONS, BINARY_EXTENSIONS
from .logging import logger
def is_image(blob):
    """Return True when the blob is a 3-channel NCHW tensor, i.e. an image input."""
    if blob.layout != "NCHW":
        return False
    return blob.shape[1] == 3
def is_image_info(blob):
    """Return True when the blob looks like image-info input: NC layout with >= 2 values."""
    if blob.layout != "NC":
        return False
    return blob.shape[1] >= 2
def set_inputs(paths_to_input, batch_size, input_info, requests):
requests_input_data = get_inputs(paths_to_input, batch_size, input_info, requests)
def set_inputs(paths_to_input, batch_size, app_input_info, requests):
requests_input_data = get_inputs(paths_to_input, batch_size, app_input_info, requests)
for i in range(len(requests)):
inputs = requests[i].input_blobs
for k, v in requests_input_data[i].items():
@ -44,19 +31,20 @@ def set_inputs(paths_to_input, batch_size, input_info, requests):
raise Exception("No input with name {} found!".format(k))
inputs[k].buffer[:] = v
def get_inputs(paths_to_input, batch_size, input_info, requests):
def get_inputs(paths_to_input, batch_size, app_input_info, requests):
input_image_sizes = {}
for key in sorted(input_info.keys()):
if is_image(input_info[key].input_data):
input_image_sizes[key] = (input_info[key].input_data.shape[2], input_info[key].input_data.shape[3])
for key in sorted(app_input_info.keys()):
info = app_input_info[key]
if info.is_image:
input_image_sizes[key] = (info.width, info.height)
logger.info("Network input '{}' precision {}, dimensions ({}): {}".format(key,
input_info[key].input_data.precision,
input_info[key].input_data.layout,
info.precision,
info.layout,
" ".join(str(x) for x in
input_info[key].input_data.shape)))
info.shape)))
images_count = len(input_image_sizes.keys())
binaries_count = len(input_info) - images_count
binaries_count = len(app_input_info) - images_count
image_files = list()
binary_files = list()
@ -100,33 +88,34 @@ def get_inputs(paths_to_input, batch_size, input_info, requests):
for request_id in range(0, len(requests)):
logger.info("Infer Request {} filling".format(request_id))
input_data = {}
keys = list(sorted(input_info.keys()))
keys = list(sorted(app_input_info.keys()))
for key in keys:
if is_image(input_info[key].input_data):
info = app_input_info[key]
if info.is_image:
# input is image
if len(image_files) > 0:
input_data[key] = fill_blob_with_image(image_files, request_id, batch_size, keys.index(key),
len(keys), input_info[key].input_data)
len(keys), info)
continue
# input is binary
if len(binary_files):
input_data[key] = fill_blob_with_binary(binary_files, request_id, batch_size, keys.index(key),
len(keys), input_info[key].input_data)
len(keys), info)
continue
# most likely input is image info
if is_image_info(input_info[key].input_data) and len(input_image_sizes) == 1:
if info.is_image_info and len(input_image_sizes) == 1:
image_size = input_image_sizes[list(input_image_sizes.keys()).pop()]
logger.info("Fill input '" + key + "' with image size " + str(image_size[0]) + "x" +
str(image_size[1]))
input_data[key] = fill_blob_with_image_info(image_size, input_info[key].input_data)
input_data[key] = fill_blob_with_image_info(image_size, info)
continue
# fill with random data
logger.info("Fill input '{}' with random values ({} is expected)".format(key, "image" if is_image(
input_info[key].input_data) else "some binary data"))
input_data[key] = fill_blob_with_random(input_info[key].input_data)
logger.info("Fill input '{}' with random values ({} is expected)".format(key, "image"
if info.is_image else "some binary data"))
input_data[key] = fill_blob_with_random(info)
requests_input_data.append(input_data)
@ -150,8 +139,8 @@ def get_files_by_extensions(paths_to_input, extensions):
return input_files
def fill_blob_with_image(image_paths, request_id, batch_size, input_id, input_size, layer):
shape = layer.shape
def fill_blob_with_image(image_paths, request_id, batch_size, input_id, input_size, info):
shape = info.shape
images = np.ndarray(shape)
image_index = request_id * batch_size * input_size + input_id
for b in range(batch_size):
@ -159,15 +148,11 @@ def fill_blob_with_image(image_paths, request_id, batch_size, input_id, input_si
image_filename = image_paths[image_index]
logger.info('Prepare image {}'.format(image_filename))
image = cv2.imread(image_filename)
new_im_size = tuple(shape[2:])
new_im_size = tuple((info.width, info.height))
if image.shape[:-1] != new_im_size:
logger.warning("Image is resized from ({}) to ({})".format(image.shape[:-1], new_im_size))
image = cv2.resize(image, new_im_size)
if image.shape[0] != shape[2]:
image = image.transpose((2, 1, 0))
else:
if info.layout in ['NCHW', 'CHW']:
image = image.transpose((2, 0, 1))
images[b] = image
@ -189,11 +174,13 @@ def get_dtype(precision):
return format_map[precision]
raise Exception("Can't find data type for precision: " + precision)
def fill_blob_with_binary(binary_paths, request_id, batch_size, input_id, input_size, layer):
binaries = np.ndarray(layer.shape)
shape = get_blob_shape(layer, 1) # get blob shape for batch 1
def fill_blob_with_binary(binary_paths, request_id, batch_size, input_id, input_size, info):
binaries = np.ndarray(info.shape)
shape = info.shape.copy()
if 'N' in info.layout:
shape[info.layout.index('N')] = 1
binary_index = request_id * batch_size * input_size + input_id
dtype = get_dtype(layer.precision)
dtype = get_dtype(info.precision)
for b in range(batch_size):
binary_index %= len(binary_paths)
binary_filename = binary_paths[binary_index]

View File

@ -1,5 +1,5 @@
"""
Copyright (C) 2018-2020 Intel Corporation
Copyright (C) 2018-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
@ -17,7 +17,6 @@ from openvino.inference_engine import IENetwork,IECore
from .constants import DEVICE_DURATION_IN_SECS, UNKNOWN_DEVICE_TYPE, \
CPU_DEVICE_NAME, GPU_DEVICE_NAME
from .inputs_filling import is_image
from .logging import logger
import json
@ -61,13 +60,13 @@ def next_step(additional_info='', step_id=0):
print(step_info_template)
def config_network_inputs(ie_network: IENetwork):
def config_network_inputs(ie_network: IENetwork, app_inputs_info):
input_info = ie_network.input_info
for key in input_info.keys():
if is_image(input_info[key].input_data):
if app_inputs_info[key].is_image:
# Set the precision of input data provided by the user
# Should be called before load of the network to the plugin
app_inputs_info[key].precision = 'U8'
input_info[key].precision = 'U8'
@ -227,33 +226,105 @@ def get_command_line_arguments(argv):
parameters.append((arg_name, arg_value))
return parameters
def parse_input_parameters(parameter_string, input_info):
    """Parse a per-input CLI parameter string into a {input_name: value} dict.

    Accepts strings like "input0[value0],input1[value1]" (per-input values) or
    "[value]" (a single value applied to every input in `input_info`).
    An empty string yields an empty dict; an unparsable string raises Exception.
    """
    return_value = {}
    if parameter_string:
        # Non-greedy groups: name before '[', value inside '[...]', optional ','.
        matches = re.findall(r'(.*?)\[(.*?)\],?', parameter_string)
        if matches:
            for match in matches:
                input_name, value = match
                if input_name != '':
                    return_value[input_name] = value
                else:
                    # Nameless "[value]" form: broadcast the value to all inputs.
                    return_value = { k:value for k in input_info.keys() }
                    break
        else:
            raise Exception("Can't parse input parameter: {}".format(parameter_string))
    return return_value
def adjust_shapes_batch(shapes, batch_size: int, inputs_info):
    """Force the batch ('N') dimension of every shape in `shapes` to `batch_size`.

    Returns True when at least one shape was modified in place.
    """
    changed = False
    for input_name, data in inputs_info.items():
        layout = data.input_data.layout
        if 'N' not in layout:
            continue  # no batch dimension for this input
        n_pos = layout.index('N')
        if shapes[input_name][n_pos] != batch_size:
            shapes[input_name][n_pos] = batch_size
            changed = True
    return changed
class InputInfo:
    """Application-side description of one network input.

    Holds the precision, layout string (e.g. "NCHW") and shape that the
    benchmark app decided to use for an input, plus convenience accessors
    for individual dimensions resolved through the layout.
    """
    def __init__(self):
        self.precision = None  # precision name, e.g. "FP32" / "U8"
        self.layout = ""       # layout string; each char names a dimension
        self.shape = []        # dimension sizes, same order as `layout`

    @property
    def is_image(self):
        """True when the input looks like a 3-channel image."""
        if self.layout not in [ "NCHW", "NHWC", "CHW", "HWC" ]:
            return False
        return self.channels == 3

    @property
    def is_image_info(self):
        """True when the input looks like an image-info blob (NC, >= 2 values)."""
        if self.layout != "NC":
            return False
        return self.channels >= 2

    def getDimensionByLayout(self, character):
        """Return the size of the dimension named `character` (e.g. 'H').

        Raises Exception when the layout has no such dimension.
        """
        if character not in self.layout:
            raise Exception("Error: Can't get {} from layout {}".format(character, self.layout))
        return self.shape[self.layout.index(character)]

    # Misspelled name kept as an alias for backward compatibility with callers.
    getDimentionByLayout = getDimensionByLayout

    @property
    def width(self):
        return self.getDimensionByLayout("W")

    @property
    def height(self):
        return self.getDimensionByLayout("H")

    @property
    def channels(self):
        return self.getDimensionByLayout("C")

    @property
    def batch(self):
        return self.getDimensionByLayout("N")

    @property
    def depth(self):
        return self.getDimensionByLayout("D")
def get_inputs_info(shape_string, layout_string, batch_size, input_info):
    """Build an InputInfo per network input from CLI overrides.

    `shape_string` / `layout_string` are the raw -shape / -layout CLI values;
    `batch_size` of 0 means "keep the network batch". Returns (info_map,
    reshape) where `reshape` is True when any shape differs from the network's.
    """
    shape_map = parse_input_parameters(shape_string, input_info)
    layout_map = parse_input_parameters(layout_string, input_info)
    info_map = {}
    reshape = False
    for name, descriptor in input_info.items():
        info = InputInfo()
        # Precision comes straight from the network description.
        info.precision = descriptor.precision
        # Shape: user-supplied override wins; otherwise use the network shape.
        custom_shape = shape_map.get(name)
        if custom_shape is not None:
            info.shape = [int(dim) for dim in custom_shape.split(',')]
            reshape = True
        else:
            info.shape = descriptor.input_data.shape
        # Layout: user-supplied override (upper-cased) wins over the network's.
        custom_layout = layout_map.get(name)
        info.layout = custom_layout.upper() if custom_layout is not None else descriptor.tensor_desc.layout
        # Propagate an explicit batch size into the 'N' dimension, if present.
        if batch_size != 0 and 'N' in info.layout:
            n_pos = info.layout.index('N')
            if info.shape[n_pos] != batch_size:
                info.shape[n_pos] = batch_size
                reshape = True
        info_map[name] = info
    return info_map, reshape
def get_batch_size(inputs_info):
    """Derive the batch size from a {name: InputInfo-like} map.

    Looks at the 'N' dimension of every input that has one; all such inputs
    must agree, otherwise an Exception is raised. Inputs without an 'N'
    dimension are ignored; when no input has one the batch size is 1.
    """
    batch_size = 0
    for _, info in inputs_info.items():
        batch_index = info.layout.index('N') if 'N' in info.layout else -1
        if batch_index != -1:
            if batch_size == 0:
                batch_size = info.shape[batch_index]
            elif batch_size != info.shape[batch_index]:
                # Fixed typo in the original message ("deterimine").
                raise Exception("Can't determine batch size: batch is different for different inputs!")
    if batch_size == 0:
        batch_size = 1
    return batch_size
def show_available_devices():
ie = IECore()