remove opencv dependencies in samples (#8123)

* remove opencv dependencies in samples

* fixed output
This commit is contained in:
Anton Romanov 2021-11-16 14:13:16 +03:00 committed by GitHub
parent 46fea0fe48
commit 5512c36358
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
9 changed files with 201 additions and 118 deletions

View File

@ -4,6 +4,10 @@
set(TARGET_NAME "benchmark_app")
if(ENABLE_OPENCV)
set(OPENCV_MODULES core)
endif()
file (GLOB SRC ${CMAKE_CURRENT_SOURCE_DIR}/*.cpp)
file (GLOB HDR ${CMAKE_CURRENT_SOURCE_DIR}/*.hpp)
@ -11,7 +15,7 @@ ie_add_sample(NAME ${TARGET_NAME}
SOURCES ${SRC}
HEADERS ${HDR}
DEPENDENCIES format_reader ie_samples_utils
OPENCV_DEPENDENCIES core)
OPENCV_DEPENDENCIES ${OPENCV_MODULES})
find_package(OpenCL)

View File

@ -38,3 +38,4 @@ void processLayout(InferenceEngine::CNNNetwork& network,
const std::string& iol);
void printInputAndOutputsInfo(const InferenceEngine::CNNNetwork& network);
void printInputAndOutputsInfo(const ov::Function& network);

View File

@ -33,6 +33,36 @@
# endif
#endif
/**
* @brief Unicode string wrappers
*/
#if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32)
# define tchar wchar_t
# define tstring std::wstring
# define tmain wmain
# define TSTRING2STRING(tstr) wstring2string(tstr)
#else
# define tchar char
# define tstring std::string
# define tmain main
# define TSTRING2STRING(tstr) tstr
#endif
#if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32)
/**
* @brief Convert wstring to string
* @param wstr wide string to convert
* @return string
*/
/// Narrows a wide string to a std::string by truncating each wchar_t to char.
/// Lossy for characters outside the single-byte range; sufficient for the
/// ASCII paths this sample deals with.
inline std::string wstring2string(const std::wstring& wstr) {
    std::string result;
    result.reserve(wstr.size());
    for (std::wstring::size_type i = 0; i < wstr.size(); ++i)
        result.push_back(static_cast<char>(wstr[i]));
    return result;
}
#endif
/**
* @brief trim from start (in place)
* @param s - string to trim

View File

@ -326,3 +326,35 @@ void printInputAndOutputsInfo(const InferenceEngine::CNNNetwork& network) {
<< layer.second->getLayout() << std::endl;
}
}
/**
 * @brief Print name, element type and shape for every input and output of a model
 * @param network ov::Function (model) to inspect; read-only
 *
 * Ports without an explicit tensor name are reported as "NONE".
 */
void printInputAndOutputsInfo(const ov::Function& network) {
    slog::info << "model name: " << network.get_friendly_name() << slog::endl;

    const std::vector<ov::Output<const ov::Node>> inputs = network.inputs();
    // Bind by const reference: copying an ov::Output handle per iteration is
    // needless work (clang-tidy performance-for-range-copy).
    for (const ov::Output<const ov::Node>& input : inputs) {
        slog::info << " inputs" << slog::endl;

        const std::string name = input.get_names().empty() ? "NONE" : input.get_any_name();
        slog::info << " input name: " << name << slog::endl;

        const ov::element::Type type = input.get_element_type();
        slog::info << " input type: " << type << slog::endl;

        const ov::Shape shape = input.get_shape();
        slog::info << " input shape: " << shape << slog::endl;
    }

    const std::vector<ov::Output<const ov::Node>> outputs = network.outputs();
    for (const ov::Output<const ov::Node>& output : outputs) {
        slog::info << " outputs" << slog::endl;

        const std::string name = output.get_names().empty() ? "NONE" : output.get_any_name();
        slog::info << " output name: " << name << slog::endl;

        const ov::element::Type type = output.get_element_type();
        slog::info << " output type: " << type << slog::endl;

        const ov::Shape shape = output.get_shape();
        slog::info << " output shape: " << shape << slog::endl;
    }
}

View File

@ -4,6 +4,5 @@
ie_add_sample(NAME hello_classification
SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
DEPENDENCIES ie_samples_utils
OPENCV_DEPENDENCIES core imgcodecs)
DEPENDENCIES format_reader ie_samples_utils)

View File

@ -4,119 +4,72 @@
#include <iterator>
#include <memory>
#include <samples/slog.hpp>
#include <string>
#include <vector>
#include "openvino/core/layout.hpp"
// clang-format off
#include "openvino/openvino.hpp"
#include "samples/classification_results.h"
#include "samples/args_helper.hpp"
#include "samples/common.hpp"
#include "samples/ocv_common.hpp"
#include "samples/classification_results.h"
#include "samples/slog.hpp"
#include "format_reader_ptr.h"
// clang-format on
using namespace ov::preprocess;
/**
* @brief Define names based depends on Unicode path support
*/
#if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32)
# define tcout std::wcout
# define file_name_t std::wstring
# define imread_t imreadW
# define ClassificationResult_t ClassificationResultW
#else
# define tcout std::cout
# define file_name_t std::string
# define imread_t cv::imread
# define ClassificationResult_t ClassificationResult
#endif
#if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32)
/**
* @brief Realization cv::imread with support Unicode paths
*/
cv::Mat imreadW(std::wstring input_image_path) {
cv::Mat image;
std::ifstream input_image_stream;
input_image_stream.open(input_image_path.c_str(), std::iostream::binary | std::ios_base::ate | std::ios_base::in);
if (input_image_stream.is_open()) {
if (input_image_stream.good()) {
input_image_stream.seekg(0, std::ios::end);
std::size_t file_size = input_image_stream.tellg();
input_image_stream.seekg(0, std::ios::beg);
std::vector<char> buffer(0);
std::copy(std::istreambuf_iterator<char>(input_image_stream),
std::istreambuf_iterator<char>(),
std::back_inserter(buffer));
image = cv::imdecode(cv::Mat(1, file_size, CV_8UC1, &buffer[0]), cv::IMREAD_COLOR);
} else {
tcout << "Input file '" << input_image_path << "' processing error" << std::endl;
}
input_image_stream.close();
} else {
tcout << "Unable to read input file '" << input_image_path << "'" << std::endl;
}
return image;
}
/**
* @brief Convert wstring to string
* @param ref on wstring
* @return string
*/
std::string simpleConvert(const std::wstring& wstr) {
std::string str;
for (auto&& wc : wstr)
str += static_cast<char>(wc);
return str;
}
/**
* @brief Main with support Unicode paths, wide strings
*/
int wmain(int argc, wchar_t* argv[]) {
#else
int main(int argc, char* argv[]) {
#endif
int tmain(int argc, tchar* argv[]) {
try {
// -------- Get OpenVINO Runtime version --------
slog::info << "OpenVINO runtime: " << ov::get_openvino_version() << slog::endl;
// -------- Get OpenVINO runtime version --------
slog::info << ov::get_openvino_version() << slog::endl;
// -------- Parsing and validation of input arguments --------
if (argc != 4) {
tcout << "Usage : " << argv[0] << " <path_to_model> <path_to_image> <device_name>" << std::endl;
slog::info << "Usage : " << argc << " <path_to_model> <path_to_image> <device_name>" << slog::endl;
return EXIT_FAILURE;
}
const file_name_t input_model{argv[1]};
const file_name_t input_image_path{argv[2]};
#if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32)
const std::string device_name = simpleConvert(argv[3]);
#else
const std::string device_name{argv[3]};
#endif
const std::string args = TSTRING2STRING(argv[0]);
const std::string model_path = TSTRING2STRING(argv[1]);
const std::string image_path = TSTRING2STRING(argv[2]);
const std::string device_name = TSTRING2STRING(argv[3]);
// -------- Step 1. Initialize OpenVINO Runtime Core --------
ov::runtime::Core core;
// -------- Step 2. Read a model --------
auto model = core.read_model(input_model);
slog::info << "Loading model files: " << model_path << slog::endl;
auto model = core.read_model(model_path);
printInputAndOutputsInfo(*model);
OPENVINO_ASSERT(model->get_parameters().size() == 1, "Sample supports models with 1 input only");
OPENVINO_ASSERT(model->get_results().size() == 1, "Sample supports models with 1 output only");
// -------- Step 3. Initialize inference engine core
// -------- Step 3. Set up input
// Read input image to a tensor and set it to an infer request
// without resize and layout conversions
cv::Mat image = imread_t(input_image_path);
// just wrap Mat data by ov::runtime::Tensor without allocating of new memory
ov::runtime::Tensor input_tensor = wrapMat2Tensor(image);
FormatReader::ReaderPtr reader(image_path.c_str());
if (reader.get() == nullptr) {
slog::warn << "Image " + image_path + " cannot be read!" << slog::endl;
throw std::logic_error("");
}
ov::element::Type input_type = ov::element::u8;
ov::Shape input_shape = {1, reader->height(), reader->width(), 3};
std::shared_ptr<unsigned char> input_data = reader->getData();
// just wrap image data by ov::runtime::Tensor without allocating of new memory
ov::runtime::Tensor input_tensor = ov::runtime::Tensor(input_type, input_shape, input_data.get());
const ov::Shape tensor_shape = input_tensor.get_shape();
const ov::Layout tensor_layout{"NHWC"};
// -------- Step 4. Apply preprocessing --------
const ov::Layout tensor_layout{"NHWC"};
// clang-format off
model = PrePostProcessor().
@ -147,8 +100,8 @@ int main(int argc, char* argv[]) {
// - precision of tensor is supposed to be 'f32'
tensor(OutputTensorInfo().
set_element_type(ov::element::f32))).
// 6) Apply preprocessing modifying the original 'model'
build(model);
// 6) Apply preprocessing modifying the original 'model'
build(model);
// clang-format on
// -------- Step 5. Loading a model to the device --------
@ -165,18 +118,16 @@ int main(int argc, char* argv[]) {
infer_request.infer();
// -------- Step 9. Process output
ov::runtime::Tensor output_tensor = infer_request.get_output_tensor();
const ov::runtime::Tensor& output_tensor = infer_request.get_output_tensor();
// Print classification results
ClassificationResult_t classification_result(output_tensor, {input_image_path});
ClassificationResult classification_result(output_tensor, {image_path});
classification_result.show();
// -----------------------------------------------------------------------------------------------------
} catch (const std::exception& ex) {
std::cerr << ex.what() << std::endl;
return EXIT_FAILURE;
}
std::cout << "This sample is an API example, for any performance measurements "
"please use the dedicated benchmark_app tool"
<< std::endl;
return EXIT_SUCCESS;
}

View File

@ -5,5 +5,4 @@
ie_add_sample(NAME hello_reshape_ssd
SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/reshape_ssd_extension.hpp"
DEPENDENCIES ie_samples_utils
OPENCV_DEPENDENCIES core imgproc imgcodecs)
DEPENDENCIES format_reader ie_samples_utils)

View File

@ -2,10 +2,12 @@
// SPDX-License-Identifier: Apache-2.0
//
#include <format_reader_ptr.h>
#include <inference_engine.hpp>
#include <memory>
#include <ngraph/ngraph.hpp>
#include <samples/ocv_common.hpp>
#include <samples/common.hpp>
#include <string>
#include <vector>
@ -54,12 +56,19 @@ int main(int argc, char* argv[]) {
std::string input_name;
SizeVector input_shape;
std::tie(input_name, input_shape) = *input_shapes.begin();
cv::Mat image = cv::imread(input_image_path);
FormatReader::ReaderPtr reader(input_image_path.c_str());
if (reader.get() == nullptr) {
std::cout << "Image " + input_image_path + " cannot be read!" << std::endl;
return 1;
}
size_t image_width, image_height;
image_width = reader->width();
image_height = reader->height();
input_shape[0] = batch_size;
input_shape[2] = static_cast<size_t>(image.rows);
input_shape[3] = static_cast<size_t>(image.cols);
input_shape[2] = image_height;
input_shape[3] = image_width;
input_shapes[input_name] = input_shape;
std::cout << "Resizing network to the image size = [" << image.rows << "x" << image.cols << "] "
std::cout << "Resizing network to the image size = [" << image_height << "x" << image_width << "] "
<< "with batch = " << batch_size << std::endl;
network.reshape(input_shapes);
// -----------------------------------------------------------------------------------------------------
@ -132,10 +141,51 @@ int main(int argc, char* argv[]) {
// --------------------------- Step 6. Prepare input
// --------------------------------------------------------
Blob::Ptr input = infer_request.GetBlob(input_name);
for (size_t b = 0; b < batch_size; b++) {
matU8ToBlob<uint8_t>(image, input, b);
/** Collect images data ptrs **/
std::shared_ptr<unsigned char> image_data, original_image_data;
/** Store image data **/
std::shared_ptr<unsigned char> original_data(reader->getData());
std::shared_ptr<unsigned char> data_reader(
reader->getData(input_info->getTensorDesc().getDims()[3], input_info->getTensorDesc().getDims()[2]));
if (data_reader.get() != nullptr) {
original_image_data = original_data;
image_data = data_reader;
} else {
throw std::logic_error("Valid input images were not found!");
}
/** Creating input blob **/
Blob::Ptr image_input = infer_request.GetBlob(input_name);
/** Filling input tensor with images. First b channel, then g and r channels **/
MemoryBlob::Ptr mimage = as<MemoryBlob>(image_input);
if (!mimage) {
std::cout << "We expect image blob to be inherited from MemoryBlob, but by fact we were not able "
"to cast imageInput to MemoryBlob"
<< std::endl;
return 1;
}
// locked memory holder should be alive all time while access to its buffer happens
auto minputHolder = mimage->wmap();
size_t num_channels = mimage->getTensorDesc().getDims()[1];
size_t image_size = mimage->getTensorDesc().getDims()[3] * mimage->getTensorDesc().getDims()[2];
unsigned char* data = minputHolder.as<unsigned char*>();
/** Iterate over all input images **/
for (size_t image_id = 0; image_id < batch_size; ++image_id) {
/** Iterate over all pixel in image (b,g,r) **/
for (size_t pid = 0; pid < image_size; pid++) {
/** Iterate over all channels **/
for (size_t ch = 0; ch < num_channels; ++ch) {
/** [images stride + channels stride + pixel id ] all in bytes **/
data[image_id * image_size * num_channels + ch * image_size + pid] =
image_data.get()[pid * num_channels + ch];
}
}
}
// -----------------------------------------------------------------------------------------------------
// --------------------------- Step 7. Do inference
@ -156,37 +206,51 @@ int main(int argc, char* argv[]) {
auto moutputHolder = moutput->rmap();
const float* detection = moutputHolder.as<const float*>();
std::vector<std::vector<int>> boxes(batch_size);
std::vector<std::vector<int>> classes(batch_size);
/* Each detection has image_id that denotes processed image */
for (size_t cur_proposal = 0; cur_proposal < max_proposal_count; cur_proposal++) {
float image_id = detection[cur_proposal * object_size + 0];
float label = detection[cur_proposal * object_size + 1];
float confidence = detection[cur_proposal * object_size + 2];
/* CPU and GPU devices have difference in DetectionOutput layer, so we
* need both checks */
if (image_id < 0 || confidence == 0.0f) {
continue;
auto image_id = static_cast<int>(detection[cur_proposal * object_size + 0]);
if (image_id < 0) {
break;
}
float xmin = detection[cur_proposal * object_size + 3] * image.cols;
float ymin = detection[cur_proposal * object_size + 4] * image.rows;
float xmax = detection[cur_proposal * object_size + 5] * image.cols;
float ymax = detection[cur_proposal * object_size + 6] * image.rows;
float confidence = detection[cur_proposal * object_size + 2];
auto label = static_cast<int>(detection[cur_proposal * object_size + 1]);
auto xmin = detection[cur_proposal * object_size + 3] * image_width;
auto ymin = detection[cur_proposal * object_size + 4] * image_height;
auto xmax = detection[cur_proposal * object_size + 5] * image_width;
auto ymax = detection[cur_proposal * object_size + 6] * image_height;
if (confidence > 0.5f) {
/** Drawing only objects with >50% probability **/
std::ostringstream conf;
conf << ":" << std::fixed << std::setprecision(3) << confidence;
cv::rectangle(image, cv::Point2f(xmin, ymin), cv::Point2f(xmax, ymax), cv::Scalar(0, 0, 255));
classes[image_id].push_back(label);
boxes[image_id].push_back(static_cast<int>(xmin));
boxes[image_id].push_back(static_cast<int>(ymin));
boxes[image_id].push_back(static_cast<int>(xmax - xmin));
boxes[image_id].push_back(static_cast<int>(ymax - ymin));
std::cout << "[" << cur_proposal << "," << label << "] element, prob = " << confidence << ", bbox = ("
<< xmin << "," << ymin << ")-(" << xmax << "," << ymax << ")"
<< ", batch id = " << image_id << std::endl;
}
}
cv::imwrite("hello_reshape_ssd_output.jpg", image);
std::cout << "The resulting image was saved in the file: "
"hello_reshape_ssd_output.jpg"
<< std::endl;
for (size_t batch_id = 0; batch_id < batch_size; ++batch_id) {
addRectangles(original_image_data.get(),
image_height,
image_width,
boxes[batch_id],
classes[batch_id],
BBOX_THICKNESS);
const std::string image_path = "hello_reshape_ssd_output.bmp";
if (writeOutputBmp(image_path, original_image_data.get(), image_height, image_width)) {
std::cout << "The resulting image was saved in the file: " + image_path << std::endl;
} else {
throw std::logic_error(std::string("Can't create a file: ") + image_path);
}
}
// -----------------------------------------------------------------------------------------------------
} catch (const std::exception& ex) {
std::cerr << ex.what() << std::endl;

View File

@ -12,6 +12,9 @@
#define CUSTOM_RELU_TYPE "CustomReLU"
/* thickness of a line (in pixels) to be used for bounding boxes */
#define BBOX_THICKNESS 2
class CustomReLUImpl : public InferenceEngine::ILayerExecImpl {
public:
explicit CustomReLUImpl(const std::shared_ptr<ngraph::Node>& node) : _node(node) {}