diff --git a/.ci/azure/linux_onnxruntime.yml b/.ci/azure/linux_onnxruntime.yml index ad5e630820d..4fd14f2c1b1 100644 --- a/.ci/azure/linux_onnxruntime.yml +++ b/.ci/azure/linux_onnxruntime.yml @@ -94,7 +94,7 @@ jobs: -DENABLE_PROFILING_ITT=OFF -DENABLE_SAMPLES=OFF -DNGRAPH_ONNX_FRONTEND_ENABLE=ON - -DNGRAPH_DEBUG_ENABLE=OFF + -DOPENVINO_DEBUG_ENABLE=OFF $(REPO_DIR) workingDirectory: $(BUILD_DIR) diff --git a/.ci/azure/windows.yml b/.ci/azure/windows.yml index 62e0fa7c712..81c1ba95601 100644 --- a/.ci/azure/windows.yml +++ b/.ci/azure/windows.yml @@ -16,7 +16,7 @@ jobs: timeoutInMinutes: 120 pool: - name: WIN_VMSS_VENV_F8S_WU2 + name: WIN_VMSS_VENV_F16S_WU2 variables: system.debug: true @@ -34,8 +34,6 @@ jobs: INSTALL_DIR: $(WORK_DIR)\install_pkg INSTALL_TEST_DIR: $(INSTALL_DIR)\tests SETUPVARS: $(INSTALL_DIR)\setupvars.bat - IB_DIR: C:\Program Files (x86)\IncrediBuild - IB_TESTCONSOLE: $(IB_DIR)\IBTestConsole.exe steps: - script: | @@ -59,12 +57,6 @@ jobs: rd /Q /S $(BUILD_SAMPLES_DIR) & mkdir $(BUILD_SAMPLES_DIR) displayName: 'Make dir' - - script: | - certutil -urlcache -split -f https://openvinoweb.z5.web.core.windows.net/incredibuild/install_ib_console.bat install_ib_console.bat - call install_ib_console.bat - workingDirectory: $(WORK_DIR) - displayName: 'Install IncrediBuild' - - checkout: self clean: true lfs: false @@ -109,9 +101,7 @@ jobs: - script: dir $(REPO_DIR)\inference-engine\temp\ /s displayName: 'List temp SDKs' - - script: | - set PATH=$(WORK_DIR)\ninja-win;%PATH% - call "$(MSVS_VARS_PATH)" && "C:\Program Files (x86)\IncrediBuild\BuildConsole.exe" /COMMAND="ninja" + - script: call "$(MSVS_VARS_PATH)" && $(WORK_DIR)\ninja-win\ninja workingDirectory: $(BUILD_DIR) displayName: 'Build Win' @@ -153,10 +143,8 @@ jobs: displayName: 'PaddlePaddle Frontend UT' continueOnError: false - - script: | - set PATH=$(IB_DIR);%PATH% - call $(SETUPVARS) && "$(IB_TESTCONSOLE)" $(INSTALL_TEST_DIR)\InferenceEngineUnitTests.exe --gtest_output=xml:TEST-InferenceEngineUnitTests-IB.xml - displayName: 'IE UT old - IB' + - script: call $(SETUPVARS) && $(INSTALL_TEST_DIR)\InferenceEngineUnitTests.exe --gtest_output=xml:TEST-InferenceEngineUnitTests.xml + displayName: 'IE UT old' continueOnError: false - script: call $(SETUPVARS) && $(INSTALL_TEST_DIR)\ieUnitTests --gtest_output=xml:TEST-ieUnitTests.xml @@ -187,11 +175,8 @@ jobs: displayName: 'TEMPLATE FuncTests' continueOnError: false - # call $(SETUPVARS) && $(INSTALL_TEST_DIR)\cpuFuncTests.exe --gtest_filter=*smoke* --gtest_output=xml:TEST-cpuFuncTests.xml - - script: | - set PATH=$(IB_DIR);%PATH% - call $(SETUPVARS) && "$(IB_TESTCONSOLE)" $(INSTALL_TEST_DIR)\cpuFuncTests.exe --gtest_filter=*smoke*:-*CompareWithRefs/base_size=16_pre_nms_topn=100_post_nms_topn=100_nms_thresh=0.7_feat_stride=1_min_size=1_ratio*:*smoke_GRUSequenceCommonZeroClip/GRUSequenceTest.CompareWithRefs/mode=CONVERT_TO_TI_MAX_SEQ_LEN_CONST_seq_lengths* --gtest_output=xml:TEST-cpuFuncTests-IB.xml /testlevel=24 - displayName: 'CPU FuncTests - IB' + - script: $(SETUPVARS) && $(INSTALL_TEST_DIR)\cpuFuncTests.exe --gtest_filter=*smoke* --gtest_output=xml:TEST-cpuFuncTests.xml + displayName: 'CPU FuncTests' continueOnError: false - script: | @@ -213,8 +198,3 @@ jobs: buildPlatform: 'x64' # Optional buildConfiguration: 'Windows' # Optional #publishRunAttachments: true # Optional - - - script: echo Stop IncrediBuild_Agent && net stop IncrediBuild_Agent - displayName: Stop IncrediBuild - continueOnError: true - enabled: false diff --git a/.ci/openvino-onnx/Dockerfile 
b/.ci/openvino-onnx/Dockerfile index 8e2365e4ebc..ada3c36adb1 100644 --- a/.ci/openvino-onnx/Dockerfile +++ b/.ci/openvino-onnx/Dockerfile @@ -68,7 +68,7 @@ RUN cmake .. \ -DENABLE_PYTHON=ON \ -DPYTHON_EXECUTABLE=/usr/bin/python3 \ -DNGRAPH_ONNX_FRONTEND_ENABLE=ON \ - -DNGRAPH_DEBUG_ENABLE=OFF \ + -DOPENVINO_DEBUG_ENABLE=OFF \ -DCMAKE_INSTALL_PREFIX=/openvino/dist \ -DNGRAPH_USE_PROTOBUF_LITE=${PROTOBUF_LITE} RUN make -j $(nproc) install diff --git a/.ci/openvino-onnx/watchdog/src/watchdog.py b/.ci/openvino-onnx/watchdog/src/watchdog.py index 9c695ef22be..3edbe478683 100644 --- a/.ci/openvino-onnx/watchdog/src/watchdog.py +++ b/.ci/openvino-onnx/watchdog/src/watchdog.py @@ -486,7 +486,7 @@ class Watchdog: self._queue_message(message, message_severity='warning', pr=pr) elif build_delta > _BUILD_DURATION_THRESHOLD: # CI job take too long, possibly froze - communicate failure - message = ('ONNX CI job build #{}, for PR #{} started,' + message = ('ONNX CI job build #{}, for PR #{} started, ' 'but did not finish in designated time of {} ' 'minutes!'.format(build_number, pr_number, str(_BUILD_DURATION_THRESHOLD.seconds / 60))) diff --git a/.gitmodules b/.gitmodules index 8569ecbb958..ce94901db10 100644 --- a/.gitmodules +++ b/.gitmodules @@ -53,3 +53,6 @@ [submodule "ncc"] path = cmake/developer_package/ncc_naming_style/ncc url = https://github.com/nithinn/ncc.git +[submodule "thirdparty/onednn_gpu"] + path = thirdparty/onednn_gpu + url = https://github.com/oneapi-src/oneDNN.git diff --git a/cmake/dependencies.cmake b/cmake/dependencies.cmake index b4946d85d11..70562b8cc96 100644 --- a/cmake/dependencies.cmake +++ b/cmake/dependencies.cmake @@ -83,7 +83,6 @@ if(THREADING STREQUAL "OMP") message(FATAL_ERROR "Intel OMP is not available on current platform") endif() update_deps_cache(OMP "${OMP}" "Path to OMP root folder") - log_rpath_from_dir(OMP "${OMP}/lib") debug_message(STATUS "intel_omp=" ${OMP}) ie_cpack_add_component(omp REQUIRED) @@ -146,12 +145,6 @@ if(THREADING STREQUAL "TBB" OR THREADING STREQUAL "TBB_AUTO") update_deps_cache(TBB_DIR "${TBB}/cmake" "Path to TBB cmake folder") update_deps_cache(TBBBIND_2_4_DIR "${TBBBIND_2_4}/cmake" "Path to TBBBIND_2_4 cmake folder") - - if(WIN32) - log_rpath_from_dir(TBB "${TBB}/bin") - else () - log_rpath_from_dir(TBB "${TBB}/lib") - endif() debug_message(STATUS "tbb=" ${TBB}) endif() @@ -242,14 +235,6 @@ if(ENABLE_OPENCV) endif() update_deps_cache(OpenCV_DIR "${ocv_cmake_path}" "Path to OpenCV package folder") - - if(WIN32) - log_rpath_from_dir(OPENCV "${OpenCV_DIR}/../bin") - elseif(ANDROID) - log_rpath_from_dir(OPENCV "${OpenCV_DIR}/../../../lib") - else() - log_rpath_from_dir(OPENCV "${OpenCV_DIR}/../lib") - endif() debug_message(STATUS "opencv=" ${OPENCV}) else() reset_deps_cache(OpenCV_DIR) @@ -277,8 +262,8 @@ if(ENABLE_GNA) set(GNA_HASH "cc954e67525006bf8bd353a6682e38bf208f6d74e973e0fc292850e721f17452") endif() if(GNA_LIBRARY_VERSION STREQUAL "GNA2") - set(GNA_VERSION "02.00.00.1226") - set(GNA_HASH "d5450af15c993e264c25ac4591a7dab44722e10d15fca4f222a1b84429d4e5b6") + set(GNA_VERSION "03.00.00.1377") + set(GNA_HASH "d45fb48994d8c2803a16e88e29ae48851066325b97c1c6c4a5bf4f4573d55c65") endif() set(FILES_TO_EXTRACT_LIST gna_${GNA_VERSION}/include) diff --git a/cmake/developer_package/debug.cmake b/cmake/developer_package/debug.cmake index bb4538dfe02..e14f30b4c0f 100644 --- a/cmake/developer_package/debug.cmake +++ b/cmake/developer_package/debug.cmake @@ -15,59 +15,3 @@ function(clean_message type) message (FATAL_ERROR) endif() endfunction() - 
-file(REMOVE ${CMAKE_BINARY_DIR}/ld_library_rpath_64.txt) - -# log relative path to shared library that has to be used in LD_LIBRARY_PATH -function (log_rpath_remove_top component component_remove_top lib lib_remove_top) - - set(top_lib_dir ${${component}}) - set(lib_dir ${lib}) - -# debug_message(STATUS "LIB-IN=${lib} ") -# debug_message(STATUS "TOPLIB-IN=${top_lib_dir} ") - get_filename_component(top_lib_dir "${${component}}" DIRECTORY) - - if (${component_remove_top} AND ${component}) - else() - get_filename_component(add_name "${${component}}" NAME) - set(top_lib_dir "${top_lib_dir}/${add_name}") - endif() - if (${lib_remove_top} AND lib) - get_filename_component(lib_dir ${lib} DIRECTORY) - endif() - - string (REPLACE "//" "/" top_lib_dir "${top_lib_dir}") - string (REPLACE "//" "/" lib_dir "${lib_dir}") - - string (REPLACE "\\\\" "/" top_lib_dir "${top_lib_dir}") - string (REPLACE "\\\\" "/" lib_dir "${lib_dir}") - -# debug_message(STATUS "LIB-OUT=${lib_dir}") -# debug_message(STATUS "TOPLIB-OUT=${top_lib_dir}") - - if (WIN32) - string (TOLOWER "${top_lib_dir}" top_lib_dir) - string (TOLOWER "${lib_dir}" lib_dir) - endif() - - string (REPLACE "${top_lib_dir}" "" component_dir "${lib_dir}") - - set(RPATH_INFO "${component}=${component_dir}") - debug_message(STATUS "LD_LIBRARY_RPATH: ${RPATH_INFO}") - file(APPEND ${CMAKE_BINARY_DIR}/ld_library_rpath_64.txt "${RPATH_INFO}\n") -endfunction() - -function (log_rpath_from_dir component lib_dir) - log_rpath_remove_top("${component}" TRUE "${lib_dir}" FALSE) -endfunction() - -function (log_rpath component lib_path) - log_rpath_remove_top(${component} TRUE ${lib_path} TRUE) -endfunction() - -# Just wrapping of the original message() function to make this macro known during IE build. -# This macro is redefined (with additional checks) within the InferenceEngineConfig.cmake file. 
-macro(ext_message TRACE_LEVEL) - message(${TRACE_LEVEL} "${ARGN}") -endmacro() diff --git a/cmake/features.cmake b/cmake/features.cmake index 450b0d255cc..7528b89d47d 100644 --- a/cmake/features.cmake +++ b/cmake/features.cmake @@ -122,7 +122,7 @@ endif() ie_dependent_option(NGRAPH_ONNX_FRONTEND_ENABLE "Enable ONNX FrontEnd" ON "protoc_available" OFF) ie_dependent_option(NGRAPH_PDPD_FRONTEND_ENABLE "Enable PaddlePaddle FrontEnd" ON "protoc_available" OFF) -ie_option(IR_FRONTEND_ENABLE "Enable IR FrontEnd" ON) +ie_option(NGRAPH_IR_FRONTEND_ENABLE "Enable IR FrontEnd" ON) ie_dependent_option(NGRAPH_USE_PROTOBUF_LITE "Compiles and links with protobuf-lite" ON "NGRAPH_ONNX_FRONTEND_ENABLE" OFF) ie_dependent_option(NGRAPH_USE_SYSTEM_PROTOBUF "Use system protobuf" OFF @@ -130,7 +130,7 @@ ie_dependent_option(NGRAPH_USE_SYSTEM_PROTOBUF "Use system protobuf" OFF ie_dependent_option(NGRAPH_UNIT_TEST_ENABLE "Enables ngraph unit tests" ON "ENABLE_TESTS;NOT ANDROID" OFF) ie_dependent_option(NGRAPH_UNIT_TEST_BACKENDS_ENABLE "Control the building of unit tests using backends" ON "NGRAPH_UNIT_TEST_ENABLE" OFF) -ie_option(NGRAPH_DEBUG_ENABLE "Enable output for NGRAPH_DEBUG statements" OFF) +ie_option(OPENVINO_DEBUG_ENABLE "Enable output for OPENVINO_DEBUG statements" OFF) ie_option(ENABLE_REQUIREMENTS_INSTALL "Dynamic dependencies install" ON) # WA for ngraph python build on Windows debug diff --git a/cmake/templates/OpenVINOConfig.cmake.in b/cmake/templates/OpenVINOConfig.cmake.in index 14fc57b36c2..eb903e14889 100644 --- a/cmake/templates/OpenVINOConfig.cmake.in +++ b/cmake/templates/OpenVINOConfig.cmake.in @@ -63,6 +63,9 @@ # `OpenVINO_Frontend_PaddlePaddle_FOUND` # OpenVINO PaddlePaddle frontend is available # +# `OpenVINO_Frontend_IR_FOUND` +# OpenVINO IR frontend is available +# # OpenVINO version variables: # # `OpenVINO_VERSION_MAJOR` @@ -169,6 +172,7 @@ set(${CMAKE_FIND_PACKAGE_NAME}_PaddlePaddle_FOUND @NGRAPH_PDPD_FRONTEND_ENABLE@) set(${CMAKE_FIND_PACKAGE_NAME}_Frontend_ONNX_FOUND ${${CMAKE_FIND_PACKAGE_NAME}_ONNX_FOUND}) set(${CMAKE_FIND_PACKAGE_NAME}_Frontend_PaddlePaddle_FOUND ${${CMAKE_FIND_PACKAGE_NAME}_PaddlePaddle_FOUND}) +set(${CMAKE_FIND_PACKAGE_NAME}_Frontend_IR_FOUND ${${CMAKE_FIND_PACKAGE_NAME}_IR_FOUND}) # if no components specified, only Runtime is provided if(NOT ${CMAKE_FIND_PACKAGE_NAME}_FIND_COMPONENTS) diff --git a/cmake/templates/ngraphConfig.cmake.in b/cmake/templates/ngraphConfig.cmake.in index a94e6b50a58..c5b467f2dd3 100644 --- a/cmake/templates/ngraphConfig.cmake.in +++ b/cmake/templates/ngraphConfig.cmake.in @@ -88,5 +88,6 @@ if(ngraph_onnx_importer_FOUND) endif() set(ngraph_paddlepaddle_frontend_FOUND ${OpenVINO_Frontend_PaddlePaddle_FOUND}) +set(ngraph_ir_frontend_FOUND ${OpenVINO_Frontend_IR_FOUND}) check_required_components(ngraph) diff --git a/cmake/test_model_zoo.cmake b/cmake/test_model_zoo.cmake index 580cab35ec4..00e360e3800 100644 --- a/cmake/test_model_zoo.cmake +++ b/cmake/test_model_zoo.cmake @@ -2,6 +2,8 @@ # SPDX-License-Identifier: Apache-2.0 # +set_property(GLOBAL PROPERTY JOB_POOLS four_jobs=4) + function(ov_model_convert SRC DST OUT) set(onnx_gen_script ${OpenVINO_SOURCE_DIR}/ngraph/test/models/onnx/onnx_prototxt_converter.py) @@ -43,6 +45,7 @@ function(ov_model_convert SRC DST OUT) "${SRC}/${in_file}" ${full_out_name} DEPENDS ${onnx_gen_script} "${SRC}/${in_file}" COMMENT "Generate ${rel_out_name}" + JOB_POOL four_jobs WORKING_DIRECTORY "${model_source_dir}") else() add_custom_command(OUTPUT ${full_out_name} @@ -50,6 +53,7 @@ 
function(ov_model_convert SRC DST OUT) "${SRC}/${in_file}" ${full_out_name} DEPENDS ${onnx_gen_script} "${SRC}/${in_file}" COMMENT "Copy ${rel_out_name}" + JOB_POOL four_jobs WORKING_DIRECTORY "${model_source_dir}") endif() list(APPEND files "${full_out_name}") diff --git a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md index 31de647f379..a304a0bb6b2 100644 --- a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md +++ b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md @@ -73,19 +73,21 @@ inp = torch.randn([seq_length, batch_size, feature_length]) feature_length = torch.LongTensor([seq_length]) x_padded, x_lens = model.encoder(inp, feature_length) torch.onnx.export(model.encoder, (inp, feature_length), "rnnt_encoder.onnx", opset_version=12, - input_names=['input.1', '1'], dynamic_axes={'input.1': {0: 'seq_len', 1: 'batch'}}) + input_names=['input', 'feature_length'], output_names=['x_padded', 'x_lens'], + dynamic_axes={'input': {0: 'seq_len', 1: 'batch'}}) symbol = torch.LongTensor([[20]]) hidden = torch.randn([2, batch_size, 320]), torch.randn([2, batch_size, 320]) g, hidden = model.prediction.forward(symbol, hidden) torch.onnx.export(model.prediction, (symbol, hidden), "rnnt_prediction.onnx", opset_version=12, - input_names=['input.1', '1', '2'], - dynamic_axes={'input.1': {0: 'batch'}, '1': {1: 'batch'}, '2': {1: 'batch'}}) + input_names=['symbol', 'hidden_in_1', 'hidden_in_2'], + output_names=['g', 'hidden_out_1', 'hidden_out_2'], + dynamic_axes={'symbol': {0: 'batch'}, 'hidden_in_1': {1: 'batch'}, 'hidden_in_2': {1: 'batch'}}) f = torch.randn([batch_size, 1, 1024]) model.joint.forward(f, g) torch.onnx.export(model.joint, (f, g), "rnnt_joint.onnx", opset_version=12, - input_names=['0', '1'], dynamic_axes={'0': {0: 'batch'}, '1': {0: 'batch'}}) + input_names=['0', '1'], output_names=['result'], dynamic_axes={'0': {0: 'batch'}, '1': {0: 'batch'}}) ``` ```bash @@ -97,10 +99,10 @@ After completing this step, the files `rnnt_encoder.onnx`, `rnnt_prediction.onnx **Step 6**. Run the conversion command: ```bash -python3 {path_to_openvino}/mo.py --input_model rnnt_encoder.onnx --input "input.1[157 1 240],1->157" -python3 {path_to_openvino}/mo.py --input_model rnnt_prediction.onnx --input "input.1[1 1],1[2 1 320],2[2 1 320]" +python3 {path_to_openvino}/mo.py --input_model rnnt_encoder.onnx --input "input[157 1 240],feature_length->157" +python3 {path_to_openvino}/mo.py --input_model rnnt_prediction.onnx --input "symbol[1 1],hidden_in_1[2 1 320],hidden_in_2[2 1 320]" python3 {path_to_openvino}/mo.py --input_model rnnt_joint.onnx --input "0[1 1 1024],1[1 1 320]" ``` Please note that hardcoded value for sequence length = 157 was taken from the MLCommons but conversion to IR preserves network [reshapeability](../../../../IE_DG/ShapeInference.md), this means you can change input shapes manually to any value either during conversion or -inference. \ No newline at end of file +inference. diff --git a/docs/index.md b/docs/index.md index 9ad04bfe960..7cc4eb90f7b 100644 --- a/docs/index.md +++ b/docs/index.md @@ -104,3 +104,9 @@ Intel® Distribution of OpenVINO™ toolkit includes the following components: - [Intel® Media SDK](https://software.intel.com/en-us/media-sdk) (in Intel® Distribution of OpenVINO™ toolkit for Linux only) OpenVINO™ Toolkit opensource version is available on [GitHub](https://github.com/openvinotoolkit/openvino). 
For building the Inference Engine from the source code, see the build instructions.
+
+
+## OpenVINO™ API 2.0
+
+OpenVINO™ API 2.0 was introduced to make the OpenVINO™ interface more user-friendly and to align OpenVINO™ with other frameworks.
+The [migration guide](@ref ov_2_0_transition_guide) is intended to simplify migrating an application from the old API to OpenVINO™ API 2.0.
diff --git a/docs/migration_ov_2_0/docs/common_inference_pipeline.md b/docs/migration_ov_2_0/docs/common_inference_pipeline.md
new file mode 100644
index 00000000000..af2dbf25304
--- /dev/null
+++ b/docs/migration_ov_2_0/docs/common_inference_pipeline.md
@@ -0,0 +1,55 @@
+# OpenVINO™ Inference Pipeline {#ov_inference_pipeline}
+
+Usually, to run inference on a model with the OpenVINO™ toolkit, an application performs the following steps:
+ 1. Create Core
+ 2. (Optional) Read model from the disk
+ 2.1. Configure Input and Output of the Model
+ 3. Load the Model to the Device
+ 4. Create an Inference Request
+ 5. Prepare Input
+ 6. Start Inference
+ 7. Process the Inference Results
+
+The code snippets below cover these steps and show how the application code should be changed for migration to OpenVINO™ 2.0.
+
+## 1. Create Core
+
+Inference Engine API:
+
+@snippet snippets/ie_common.cpp ie:create_core
+
+OpenVINO™ 2.0 API:
+
+@snippet snippets/ov_common.cpp ov_api_2_0:create_core
+
+## 2. (Optional) Read model from the disk
+
+Inference Engine API:
+
+@snippet snippets/ie_common.cpp ie:read_model
+
+OpenVINO™ 2.0 API:
+
+@snippet snippets/ov_common.cpp ov_api_2_0:read_model
+
+### 2.1 Configure Input and Output of the Model
+
+Inference Engine API:
+
+@snippet snippets/ie_common.cpp ie:get_inputs_outputs
+
+OpenVINO™ 2.0 API:
+
+@snippet snippets/ov_common.cpp ov_api_2_0:get_inputs_outputs
+
+## 3. Load the Model to the Device
+
+Inference Engine API:
+
+@snippet snippets/ie_common.cpp ie:compile_model
+
+OpenVINO™ 2.0 API:
+
+@snippet snippets/ov_common.cpp ov_api_2_0:compile_model
+
+## 5. TBD
diff --git a/docs/migration_ov_2_0/docs/intro.md b/docs/migration_ov_2_0/docs/intro.md
new file mode 100644
index 00000000000..5d89b7aff3d
--- /dev/null
+++ b/docs/migration_ov_2_0/docs/intro.md
@@ -0,0 +1,12 @@
+# OpenVINO™ API 2.0 transition guide {#ov_2_0_transition_guide}
+
+OpenVINO™ API 2.0 was introduced to simplify migration from other frameworks and to make the OpenVINO™ API more user-friendly.
+The main differences between the APIs are listed below:
+
+ - OpenVINO™ API 2.0 uses tensor names or indices to work with inputs and outputs, while the old API works with operation names.
+ - Structures for shapes and element types were changed.
+ - The naming style was changed: the old API uses CamelCase, while OpenVINO™ API 2.0 uses snake_case for function names.
+ - Namespaces were aligned between components.
+
+See the following transition guides to learn how to migrate your own application to OpenVINO™ API 2.0:
+ - [OpenVINO™ Common Inference pipeline](@ref ov_inference_pipeline)
diff --git a/docs/nGraph_DG/nGraph_debug_capabilities.md b/docs/nGraph_DG/nGraph_debug_capabilities.md
index e2ae82743c1..bda4dff150c 100644
--- a/docs/nGraph_DG/nGraph_debug_capabilities.md
+++ b/docs/nGraph_DG/nGraph_debug_capabilities.md
@@ -3,7 +3,7 @@
 nGraph representation provides an API to get detailed information about the graph structure. To receive additional messages about applied graph modifications, rebuild the nGraph library with
-the `-DNGRAPH_DEBUG_ENABLE=ON` option.
+the `-DOPENVINO_DEBUG_ENABLE=ON` option.
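With a debug-enabled build, transformation code can emit messages through the debug logging macro. A minimal sketch of such a statement — assuming the macro keeps the stream-style interface of the former `NGRAPH_DEBUG`, and that `ngraph/log.hpp` is still the providing header:

```cpp
#include <ngraph/log.hpp>

void report_fusion_progress() {
    // Compiled to a no-op unless the library was built with
    // -DOPENVINO_DEBUG_ENABLE=ON.
    OPENVINO_DEBUG << "matched multiply-add pattern, fusing nodes";
}
```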
To visualize the nGraph function in the xDot format or as an image file, use the `ngraph::pass::VisualizeTree` graph transformation pass:
diff --git a/docs/snippets/ie_common.cpp b/docs/snippets/ie_common.cpp
new file mode 100644
index 00000000000..6a558129243
--- /dev/null
+++ b/docs/snippets/ie_common.cpp
@@ -0,0 +1,43 @@
+// Copyright (C) 2018-2021 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <inference_engine.hpp>
+
+int main() {
+    //! [ie:create_core]
+    InferenceEngine::Core core;
+    //! [ie:create_core]
+
+    //! [ie:read_model]
+    InferenceEngine::CNNNetwork network = core.ReadNetwork("model.xml");
+    //! [ie:read_model]
+
+    //! [ie:get_inputs_outputs]
+    InferenceEngine::InputsDataMap inputs = network.getInputsInfo();
+    InferenceEngine::OutputsDataMap outputs = network.getOutputsInfo();
+    //! [ie:get_inputs_outputs]
+
+    //! [ie:compile_model]
+    InferenceEngine::ExecutableNetwork exec_network = core.LoadNetwork(network, "CPU");
+    //! [ie:compile_model]
+
+    //! [ie:create_infer_request]
+    InferenceEngine::InferRequest infer_request = exec_network.CreateInferRequest();
+    //! [ie:create_infer_request]
+
+    //! [ie:get_input_tensor]
+    InferenceEngine::Blob::Ptr input_blob = infer_request.GetBlob(inputs.begin()->first);
+    // fill input blob
+    //! [ie:get_input_tensor]
+
+    //! [ie:inference]
+    infer_request.Infer();
+    //! [ie:inference]
+
+    //! [ie:get_output_tensor]
+    InferenceEngine::Blob::Ptr output_blob = infer_request.GetBlob(outputs.begin()->first);
+    // process output data
+    //! [ie:get_output_tensor]
+    return 0;
+}
diff --git a/docs/snippets/nGraphTutorial.cpp b/docs/snippets/nGraphTutorial.cpp
index 6011becf4ec..e39e783d5eb 100644
--- a/docs/snippets/nGraphTutorial.cpp
+++ b/docs/snippets/nGraphTutorial.cpp
@@ -23,12 +23,10 @@
 acos0->set_argument(0, add0);
 add1->set_argument(0, acos0);
 add1->set_argument(1, abs0);
-// Run shape inference on the nodes
-NodeVector ops{arg0, arg1, add0, abs0, acos0, add1};
-validate_nodes_and_infer_types(ops);
-
 // Create a graph with one output (add1) and two inputs (arg0, arg1)
 auto ng_function = make_shared<Function>(OutputVector{add1}, ParameterVector{arg0, arg1});
+// Run shape inference on the nodes
+ng_function->validate_nodes_and_infer_types();
 //! [part0]
diff --git a/docs/snippets/ov_common.cpp b/docs/snippets/ov_common.cpp
new file mode 100644
index 00000000000..7cb9e344f7c
--- /dev/null
+++ b/docs/snippets/ov_common.cpp
@@ -0,0 +1,34 @@
+// Copyright (C) 2018-2021 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+#include <openvino/core/function.hpp>
+#include <openvino/runtime/core.hpp>
+
+int main() {
+    //! [ov_api_2_0:create_core]
+    ov::runtime::Core core;
+    //! [ov_api_2_0:create_core]
+
+    //! [ov_api_2_0:read_model]
+    std::shared_ptr<ov::Function> network = core.read_model("model.xml");
+    //! [ov_api_2_0:read_model]
+
+    //! [ov_api_2_0:get_inputs_outputs]
+    ov::ParameterVector inputs = network->get_parameters();
+    ov::ResultVector outputs = network->get_results();
+    //! [ov_api_2_0:get_inputs_outputs]
+
+    //! [ov_api_2_0:compile_model]
+    ov::runtime::ExecutableNetwork exec_network = core.compile_model(network, "CPU");
+    //! [ov_api_2_0:compile_model]
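+
+    // Steps 4-7 (create an infer request, prepare inputs, run inference,
+    // process results) follow; the input/output handling is still a
+    // placeholder in this snippet. A hedged sketch of the expected flow —
+    // the tensor fill/read steps are assumptions about the 2.0 API, not
+    // part of this change:
+    //   auto request = exec_network.create_infer_request();
+    //   // fill the tensor for inputs[0], then:
+    //   request.infer();
+    //   // read the tensor for outputs[0]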
+
+    ov::runtime::InferRequest infer_request = exec_network.create_infer_request();
+    //
+    // InferenceEngine::Blob::Ptr input_blob = infer_request.GetBlob(inputs.begin()->first);
+    // // fill input blob
+    // infer_request.Infer();
+    //
+    // InferenceEngine::Blob::Ptr output_blob = infer_request.GetBlob(outputs.begin()->first);
+    // process output data
+    return 0;
+}
diff --git a/inference-engine/cmake/vpu_dependencies.cmake b/inference-engine/cmake/vpu_dependencies.cmake
index e6ec3799a3c..00cf63344ce 100644
--- a/inference-engine/cmake/vpu_dependencies.cmake
+++ b/inference-engine/cmake/vpu_dependencies.cmake
@@ -110,8 +110,6 @@ if(ANDROID)
     set(LIBUSB_INCLUDE_DIR "${LIBUSB}/include")
     set(LIBUSB_LIBRARY "${LIBUSB}/libs/${ANDROID_ABI}/libusb1.0.so")
-
-    log_rpath_from_dir(LIBUSB "${LIBUSB}/libs/${ANDROID_ABI}")
 endif()
 #
diff --git a/inference-engine/ie_bridges/python/sample/speech_sample/README.md b/inference-engine/ie_bridges/python/sample/speech_sample/README.md
index 54403416bc4..2809cc72a5f 100644
--- a/inference-engine/ie_bridges/python/sample/speech_sample/README.md
+++ b/inference-engine/ie_bridges/python/sample/speech_sample/README.md
@@ -89,15 +89,15 @@ optional arguments:
                         Path to an .xml file with a trained model (required if
                         -rg is missing).
   -rg IMPORT_GNA_MODEL, --import_gna_model IMPORT_GNA_MODEL
-                        Read GNA model from file using path/filename provided 
+                        Read GNA model from file using path/filename provided
                         (required if -m is missing).
 Options:
   -h, --help            Show this help message and exit.
   -i INPUT, --input INPUT
-                        Required. Path to an input file (.ark or .npz). 
+                        Required. Path to an input file (.ark or .npz).
   -o OUTPUT, --output OUTPUT
-                        Optional. Output file name to save inference results 
+                        Optional. Output file name to save inference results
                         (.ark or .npz).
   -r REFERENCE, --reference REFERENCE
                         Optional. Read reference score file and compare
@@ -117,7 +117,8 @@ Options:
                         (default 16).
   -sf SCALE_FACTOR, --scale_factor SCALE_FACTOR
                         Optional. The user-specified input scale factor for
-                        quantization.
+                        quantization. If the network contains multiple inputs,
+                        provide scale factors by separating them with commas.
   -wg EXPORT_GNA_MODEL, --export_gna_model EXPORT_GNA_MODEL
                         Optional. Write GNA model to file using path/filename
                         provided.
@@ -176,27 +177,30 @@ The sample application logs each step in a standard output stream.
 [ INFO ] Creating Inference Engine
 [ INFO ] Reading the network: wsj_dnn5b.xml
 [ INFO ] Configuring input and output blobs
-[ INFO ] Using scale factor of 2175.4322417 calculated from first utterance.
+[ INFO ] Using scale factor(s) calculated from first utterance +[ INFO ] For input 0 using scale factor of 2175.4322418 [ INFO ] Loading the model to the plugin [ INFO ] Starting inference in synchronous mode [ INFO ] Utterance 0 (4k0c0301) +[ INFO ] Output blob name: affinetransform14/Fused_Add_ [ INFO ] Frames in utterance: 1294 -[ INFO ] Total time in Infer (HW and SW): 5305.47ms -[ INFO ] max error: 0.7051839 -[ INFO ] avg error: 0.0448387 -[ INFO ] avg rms error: 0.0582387 -[ INFO ] stdev error: 0.0371649 +[ INFO ] Total time in Infer (HW and SW): 6211.45ms +[ INFO ] max error: 0.7051840 +[ INFO ] avg error: 0.0448388 +[ INFO ] avg rms error: 0.0582387 +[ INFO ] stdev error: 0.0371650 [ INFO ] [ INFO ] Utterance 1 (4k0c0302) +[ INFO ] Output blob name: affinetransform14/Fused_Add_ [ INFO ] Frames in utterance: 1005 -[ INFO ] Total time in Infer (HW and SW): 5031.53ms +[ INFO ] Total time in Infer (HW and SW): 4742.27ms [ INFO ] max error: 0.7575974 [ INFO ] avg error: 0.0452166 [ INFO ] avg rms error: 0.0586013 [ INFO ] stdev error: 0.0372769 -[ INFO ] ... -[ INFO ] Total sample time: 38033.09ms +[ INFO ] Total sample time: 40219.99ms +[ INFO ] File result.npz was created! [ INFO ] This sample is an API example, for any performance measurements please use the dedicated benchmark_app tool ``` diff --git a/inference-engine/ie_bridges/python/sample/speech_sample/arg_parser.py b/inference-engine/ie_bridges/python/sample/speech_sample/arg_parser.py index 1d2ad5c7d71..d4e2b345ea2 100644 --- a/inference-engine/ie_bridges/python/sample/speech_sample/arg_parser.py +++ b/inference-engine/ie_bridges/python/sample/speech_sample/arg_parser.py @@ -28,8 +28,9 @@ def parse_args() -> argparse.Namespace: args.add_argument('-bs', '--batch_size', default=1, type=int, help='Optional. Batch size 1-8 (default 1).') args.add_argument('-qb', '--quantization_bits', default=16, type=int, help='Optional. Weight bits for quantization: 8 or 16 (default 16).') - args.add_argument('-sf', '--scale_factor', type=float, - help='Optional. The user-specified input scale factor for quantization.') + args.add_argument('-sf', '--scale_factor', type=str, + help='Optional. The user-specified input scale factor for quantization. ' + 'If the network contains multiple inputs, provide scale factors by separating them with commas.') args.add_argument('-wg', '--export_gna_model', type=str, help='Optional. 
Write GNA model to file using path/filename provided.') args.add_argument('-we', '--export_embedded_gna_model', type=str, help=argparse.SUPPRESS) diff --git a/inference-engine/ie_bridges/python/sample/speech_sample/speech_sample.py b/inference-engine/ie_bridges/python/sample/speech_sample/speech_sample.py index 67601e1f379..14d2e4fa441 100755 --- a/inference-engine/ie_bridges/python/sample/speech_sample/speech_sample.py +++ b/inference-engine/ie_bridges/python/sample/speech_sample/speech_sample.py @@ -103,6 +103,32 @@ def get_output_layer_list(net: Union[IENetwork, ExecutableNetwork], return [list(net.outputs.keys())[-1]] +def parse_scale_factors(args: argparse.Namespace) -> list: + """Get a list of scale factors for input files""" + input_files = re.split(', |,', args.input) + scale_factors = re.split(', |,', str(args.scale_factor)) + scale_factors = list(map(float, scale_factors)) + + if len(input_files) != len(scale_factors): + log.error(f'Incorrect command line for multiple inputs: {len(scale_factors)} scale factors provided for ' + f'{len(input_files)} input files.') + sys.exit(-7) + + for i, scale_factor in enumerate(scale_factors): + if float(scale_factor) < 0: + log.error(f'Scale factor for input #{i} (counting from zero) is out of range (must be positive).') + sys.exit(-8) + + return scale_factors + + +def set_scale_factors(plugin_config: dict, scale_factors: list): + """Set a scale factor provided for each input""" + for i, scale_factor in enumerate(scale_factors): + log.info(f'For input {i} using scale factor of {scale_factor:.7f}') + plugin_config[f'GNA_SCALE_FACTOR_{i}'] = str(scale_factor) + + def main(): log.basicConfig(format='[ %(levelname)s ] %(message)s', level=log.INFO, stream=sys.stdout) args = parse_args() @@ -149,16 +175,23 @@ def main(): # Set a GNA scale factor if args.import_gna_model: - log.info(f'Using scale factor from the imported GNA model: {args.import_gna_model}') - elif args.scale_factor: - log.info(f'Using scale factor of {args.scale_factor:.7f} specified by user.') - plugin_config['GNA_SCALE_FACTOR'] = str(args.scale_factor) + if args.scale_factor: + log.warning(f'Custom scale factor will be used for imported GNA model: {args.import_gna_model}') + set_scale_factors(plugin_config, parse_scale_factors(args)) + else: + log.info(f'Using scale factor from the imported GNA model: {args.import_gna_model}') else: - utterances = read_utterance_file(args.input.split(',')[0]) - key = sorted(utterances)[0] - scale_factor = get_scale_factor(utterances[key]) - log.info(f'Using scale factor of {scale_factor:.7f} calculated from first utterance.') - plugin_config['GNA_SCALE_FACTOR'] = str(scale_factor) + if args.scale_factor: + set_scale_factors(plugin_config, parse_scale_factors(args)) + else: + scale_factors = [] + + for file_name in re.split(', |,', args.input): + first_utterance = next(iter(read_utterance_file(file_name).values())) + scale_factors.append(get_scale_factor(first_utterance)) + + log.info('Using scale factor(s) calculated from first utterance') + set_scale_factors(plugin_config, scale_factors) if args.export_embedded_gna_model: plugin_config['GNA_FIRMWARE_MODEL_IMAGE'] = args.export_embedded_gna_model diff --git a/inference-engine/ie_bridges/python/src/openvino/inference_engine/ie_api_impl.cpp b/inference-engine/ie_bridges/python/src/openvino/inference_engine/ie_api_impl.cpp index fcd8613f444..a0763f79765 100644 --- a/inference-engine/ie_bridges/python/src/openvino/inference_engine/ie_api_impl.cpp +++ 
b/inference-engine/ie_bridges/python/src/openvino/inference_engine/ie_api_impl.cpp
@@ -196,6 +196,10 @@ public:
         versionInfo = &ExtensionDescription;
     }
 
+    std::map<std::string, ngraph::OpSet> getOpSets() override {
+        return {{"framework_node_ext", ngraph::OpSet()}};
+    }
+
     void Unload() noexcept override {}
 };
diff --git a/inference-engine/ie_bridges/python/src/openvino/offline_transformations/CMakeLists.txt b/inference-engine/ie_bridges/python/src/openvino/offline_transformations/CMakeLists.txt
index 0aa8280bc5c..bc9115229e6 100644
--- a/inference-engine/ie_bridges/python/src/openvino/offline_transformations/CMakeLists.txt
+++ b/inference-engine/ie_bridges/python/src/openvino/offline_transformations/CMakeLists.txt
@@ -59,10 +59,8 @@ add_custom_command(TARGET ${TARGET_NAME}
 # ie_cpack_add_component(${PYTHON_VERSION}_dev DEPENDS ${PYTHON_COMPONENT})
 
 install(TARGETS ${TARGET_NAME}
-        RUNTIME DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/offline_transformations
-        COMPONENT ${PYTHON_COMPONENT}
-        LIBRARY DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/offline_transformations
-        COMPONENT ${PYTHON_COMPONENT})
+        RUNTIME DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/offline_transformations COMPONENT ${PYTHON_COMPONENT}
+        LIBRARY DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/offline_transformations COMPONENT ${PYTHON_COMPONENT})
 
 install(PROGRAMS __init__.py
         DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/offline_transformations
diff --git a/inference-engine/ie_bridges/python/src/openvino/test_utils/CMakeLists.txt b/inference-engine/ie_bridges/python/src/openvino/test_utils/CMakeLists.txt
index cb071162e35..c6ae33c7951 100644
--- a/inference-engine/ie_bridges/python/src/openvino/test_utils/CMakeLists.txt
+++ b/inference-engine/ie_bridges/python/src/openvino/test_utils/CMakeLists.txt
@@ -51,4 +51,17 @@ add_custom_command(TARGET ${TARGET_NAME}
 )
 
 add_clang_format_target(${TARGET_NAME}_clang FOR_TARGETS ${TARGET_NAME}
-                        EXCLUDE_PATTERNS ".*\\.cxx;.*\\.pxd;.*\\.pyx")
\ No newline at end of file
+                        EXCLUDE_PATTERNS ".*\\.cxx;.*\\.pxd;.*\\.pyx")
+
+# install
+
+install(TARGETS ${TARGET_NAME}
+        RUNTIME DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/test_utils
+        COMPONENT tests EXCLUDE_FROM_ALL
+        LIBRARY DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/test_utils
+        COMPONENT tests EXCLUDE_FROM_ALL)
+
+install(PROGRAMS __init__.py
+        DESTINATION ${PYTHON_BRIDGE_CPACK_PATH}/${PYTHON_VERSION}/openvino/test_utils
+        COMPONENT tests
+        EXCLUDE_FROM_ALL)
diff --git a/inference-engine/ie_bridges/python/tests/conftest.py b/inference-engine/ie_bridges/python/tests/conftest.py
index f0e5059d040..365e2f2f368 100644
--- a/inference-engine/ie_bridges/python/tests/conftest.py
+++ b/inference-engine/ie_bridges/python/tests/conftest.py
@@ -51,10 +51,44 @@ def pytest_configure(config):
     )
 
 
-def create_ngraph_function(inputShape):
+def create_encoder(input_shape, levels=4):
     import ngraph as ng
-    inputShape = ng.impl.PartialShape(inputShape)
-    param = ng.parameter(inputShape, dtype=np.float32, name="data")
-    result = ng.relu(param, name='out')
+    # input
+    input_node = ng.parameter(input_shape, np.float32, name="data")
+
+    padding_begin = padding_end = [0, 0]
+    strides = [1, 1]
+    dilations = [1, 1]
+    input_channels = [input_shape[1]]
+    last_output = input_node
+
+    # convolution layers
+    for i in range(levels):
+        input_c = input_channels[-1]
+        output_c = input_c * 2
+        conv_w = np.random.uniform(0, 1, [output_c, input_c, 5,
5]).astype(np.float32) + conv_node = ng.convolution(last_output, conv_w, strides, padding_begin, padding_end, dilations) + input_channels.append(output_c) + last_output = conv_node + + # deconvolution layers + for i in range(levels): + input_c = input_channels[-2] + output_c = input_channels.pop(-1) + deconv_w = np.random.uniform(0, 1, [output_c, input_c, 5, 5]).astype(np.float32) + deconv_node = ng.convolution_backprop_data(last_output, deconv_w, strides) + last_output = deconv_node + + # result + last_output.set_friendly_name("out") + result_node = ng.result(last_output) + return ng.Function(result_node, [input_node], "Encoder") + + +def create_relu(input_shape): + import ngraph as ng + input_shape = ng.impl.PartialShape(input_shape) + param = ng.parameter(input_shape, dtype=np.float32, name="data") + result = ng.relu(param, name="out") function = ng.Function(result, [param], "TestFunction") return function diff --git a/inference-engine/ie_bridges/python/tests/test_Blob.py b/inference-engine/ie_bridges/python/tests/test_Blob.py index cd2a48a2724..14624fa3daa 100644 --- a/inference-engine/ie_bridges/python/tests/test_Blob.py +++ b/inference-engine/ie_bridges/python/tests/test_Blob.py @@ -140,10 +140,11 @@ def test_set_shape(): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_blob_set_shape_after_async_infer(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function([ng.Dimension(0,5), ng.Dimension(4), ng.Dimension(20), ng.Dimension(20)]) + function = create_encoder([1, 4, 20, 20]) net = ng.function_to_cnn(function) + net.reshape({"data": [(1, 5), 4, 20, 20]}) ie_core = IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") exec_net = ie_core.load_network(net, "TEMPLATE") @@ -152,3 +153,4 @@ def test_blob_set_shape_after_async_infer(): with pytest.raises(RuntimeError) as e: request.input_blobs['data'].set_shape([3, 4, 20, 20]) assert "REQUEST_BUSY" in str(e.value) + request.wait() diff --git a/inference-engine/ie_bridges/python/tests/test_CDataPtr.py b/inference-engine/ie_bridges/python/tests/test_CDataPtr.py index 4969aba4a5c..838c8c8f282 100644 --- a/inference-engine/ie_bridges/python/tests/test_CDataPtr.py +++ b/inference-engine/ie_bridges/python/tests/test_CDataPtr.py @@ -61,9 +61,9 @@ def test_initialized(device): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_is_dynamic(): - from conftest import create_ngraph_function + from conftest import create_relu import ngraph as ng - function = create_ngraph_function([-1, 3, 20, 20]) + function = create_relu([-1, 3, 20, 20]) net = ng.function_to_cnn(function) ie = IECore() ie.register_plugin("templatePlugin", "TEMPLATE") diff --git a/inference-engine/ie_bridges/python/tests/test_DataPtr.py b/inference-engine/ie_bridges/python/tests/test_DataPtr.py index 40ae28b2001..27b6fec64ed 100644 --- a/inference-engine/ie_bridges/python/tests/test_DataPtr.py +++ b/inference-engine/ie_bridges/python/tests/test_DataPtr.py @@ -48,9 +48,9 @@ def test_initialized(): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_is_dynamic(): - from conftest import create_ngraph_function + from conftest import create_relu import ngraph as ng - function = create_ngraph_function([-1, 3, 20, 20]) + function = create_relu([-1, 3, 20, 20]) net = ng.function_to_cnn(function) assert net.input_info["data"].input_data.is_dynamic assert net.outputs["out"].is_dynamic diff --git 
a/inference-engine/ie_bridges/python/tests/test_IENetwork.py b/inference-engine/ie_bridges/python/tests/test_IENetwork.py index 607c8296f4b..7a6daac7214 100644 --- a/inference-engine/ie_bridges/python/tests/test_IENetwork.py +++ b/inference-engine/ie_bridges/python/tests/test_IENetwork.py @@ -166,9 +166,9 @@ def test_reshape(): ([1, 3, -1, 25], [1, 3, 22, -1]) ]) def test_reshape_with_partial_shape(device, shape, p_shape): - from conftest import create_ngraph_function + from conftest import create_relu import ngraph as ng - function = create_ngraph_function(shape) + function = create_relu(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) changedFunction = ng.function_from_cnn(net) @@ -185,9 +185,9 @@ def test_reshape_with_partial_shape(device, shape, p_shape): @pytest.mark.ngraph_dependent_test def test_incorrect_reshape(device): - from conftest import create_ngraph_function + from conftest import create_relu import ngraph as ng - function = create_ngraph_function([1, 3, 22, 22]) + function = create_relu([1, 3, 22, 22]) net = ng.function_to_cnn(function) with pytest.raises(ValueError) as e: net.reshape({"data": [(2, 4, 6), 3, 22, 22]}) @@ -287,9 +287,9 @@ def test_tensor_names(): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_create_two_exec_net(): - from conftest import create_ngraph_function + from conftest import create_relu import ngraph as ng - function = create_ngraph_function([ng.Dimension(0,5), ng.Dimension(4), ng.Dimension(20), ng.Dimension(20)]) + function = create_relu([ng.Dimension(0,5), ng.Dimension(4), ng.Dimension(20), ng.Dimension(20)]) net = ng.function_to_cnn(function) ie_core = IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") diff --git a/inference-engine/ie_bridges/python/tests/test_InferRequest.py b/inference-engine/ie_bridges/python/tests/test_InferRequest.py index a1ea7ce8bce..f82cbf5327f 100644 --- a/inference-engine/ie_bridges/python/tests/test_InferRequest.py +++ b/inference-engine/ie_bridges/python/tests/test_InferRequest.py @@ -589,13 +589,13 @@ def test_query_state_write_buffer(device, input_shape, data_type, mode): @pytest.mark.parametrize("shape, p_shape, ref_shape", [ ([1, 4, 20, 20], [-1, 4, 20, 20], [5, 4, 20, 20]), ([1, 4, 20, 20], [(0,5), 4, 20, 20], [3, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [2, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [6, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [2, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [6, 4, 20, 20]), ]) def test_infer_dynamic_network_with_set_shape(shape, p_shape, ref_shape): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function(shape) + function = create_encoder(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) ie_core = ie.IECore() @@ -616,13 +616,13 @@ def test_infer_dynamic_network_with_set_shape(shape, p_shape, ref_shape): @pytest.mark.parametrize("shape, p_shape, ref_shape", [ ([1, 4, 20, 20], [-1, 4, 20, 20], [5, 4, 20, 20]), ([1, 4, 20, 20], [(0,5), 4, 20, 20], [3, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [2, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [6, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [2, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [6, 4, 20, 20]), ]) def test_infer_dynamic_network_without_set_shape(shape, p_shape, ref_shape): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = 
create_ngraph_function(shape) + function = create_encoder(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) ie_core = ie.IECore() @@ -642,13 +642,13 @@ def test_infer_dynamic_network_without_set_shape(shape, p_shape, ref_shape): @pytest.mark.parametrize("shape, p_shape, ref_shape", [ ([1, 4, 20, 20], [-1, 4, 20, 20], [5, 4, 20, 20]), ([1, 4, 20, 20], [(0,5), 4, 20, 20], [3, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [2, 4, 20, 20]), - ([1, 4, 20, 20], [(3,5), 3, 20, 20], [6, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [2, 4, 20, 20]), + ([1, 4, 20, 20], [(3,5), 4, 20, 20], [6, 4, 20, 20]), ]) def test_infer_dynamic_network_with_set_blob(shape, p_shape, ref_shape): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function(shape) + function = create_encoder(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) ie_core = ie.IECore() @@ -670,11 +670,11 @@ def test_infer_dynamic_network_with_set_blob(shape, p_shape, ref_shape): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_infer_dynamic_network_twice(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng shape, p_shape = [1, 4, 20, 20], [(0,5), 4, 20, 20] ref_shape1, ref_shape2 = [2, 4, 20, 20], [3, 4, 20, 20] - function = create_ngraph_function(shape) + function = create_encoder(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) ie_core = ie.IECore() @@ -692,11 +692,11 @@ def test_infer_dynamic_network_twice(): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_infer_dynamic_network_with_set_blob_twice(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng shape, p_shape = [1, 4, 20, 20], [(0,5), 4, 20, 20] ref_shape1, ref_shape2 = [2, 4, 20, 20], [3, 4, 20, 20] - function = create_ngraph_function(shape) + function = create_encoder(shape) net = ng.function_to_cnn(function) net.reshape({"data": p_shape}) ie_core = ie.IECore() @@ -723,14 +723,14 @@ def test_infer_dynamic_network_with_set_blob_twice(): @pytest.mark.template_plugin @pytest.mark.parametrize("shapes", [ ([3, 4, 20, 20], [3, 4, 20, 20], [3, 4, 20, 20]), - ([3, 4, 20, 20], [3, 6, 20, 20], [3, 8, 20, 20]), + ([3, 4, 20, 20], [3, 4, 28, 28], [3, 4, 45, 45]), ]) def test_async_infer_dynamic_network_3_requests(shapes): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function([3, 4, 20, 20]) + function = create_encoder([3, 4, 20, 20]) net = ng.function_to_cnn(function) - net.reshape({"data": [3, (2, 10), 20, 20]}) + net.reshape({"data": [3, 4, (20, 50), (20, 50)]}) ie_core = ie.IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") exec_net = ie_core.load_network(net, "TEMPLATE", num_requests=3) @@ -745,9 +745,9 @@ def test_async_infer_dynamic_network_3_requests(shapes): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_set_blob_with_incorrect_name(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function([4, 4, 20, 20]) + function = create_encoder([4, 4, 20, 20]) net = ng.function_to_cnn(function) ie_core = ie.IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") @@ -763,9 +763,9 @@ def test_set_blob_with_incorrect_name(): @pytest.mark.ngraph_dependent_test 
@pytest.mark.template_plugin def test_set_blob_with_incorrect_size(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function([4, 4, 20, 20]) + function = create_encoder([4, 4, 20, 20]) net = ng.function_to_cnn(function) ie_core = ie.IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") @@ -773,6 +773,7 @@ def test_set_blob_with_incorrect_size(): tensor_desc = exec_net.requests[0].input_blobs["data"].tensor_desc tensor_desc.dims = [tensor_desc.dims[0]*2, 4, 20, 20] blob = ie.Blob(tensor_desc) + print(exec_net.requests[0].output_blobs) with pytest.raises(RuntimeError) as e: exec_net.requests[0].set_blob("data", blob) assert f"Input blob size is not equal network input size" in str(e.value) @@ -784,10 +785,11 @@ def test_set_blob_with_incorrect_size(): @pytest.mark.ngraph_dependent_test @pytest.mark.template_plugin def test_set_blob_after_async_infer(): - from conftest import create_ngraph_function + from conftest import create_encoder import ngraph as ng - function = create_ngraph_function([ng.Dimension(0,5), ng.Dimension(4), ng.Dimension(20), ng.Dimension(20)]) + function = create_encoder([1, 4, 20, 20]) net = ng.function_to_cnn(function) + net.reshape({"data": [(0, 5), 4, 20, 20]}) ie_core = ie.IECore() ie_core.register_plugin("templatePlugin", "TEMPLATE") exec_net = ie_core.load_network(net, "TEMPLATE") @@ -799,3 +801,4 @@ def test_set_blob_after_async_infer(): with pytest.raises(RuntimeError) as e: request.set_blob("data", blob) assert "REQUEST_BUSY" in str(e.value) + request.wait() diff --git a/inference-engine/ie_bridges/python/tests/test_NGraph.py b/inference-engine/ie_bridges/python/tests/test_NGraph.py index 139d132eb0f..13d2061ecbb 100644 --- a/inference-engine/ie_bridges/python/tests/test_NGraph.py +++ b/inference-engine/ie_bridges/python/tests/test_NGraph.py @@ -6,14 +6,14 @@ import ngraph as ng from ngraph.impl.op import Parameter from ngraph.impl import Function, Shape, Type -from conftest import model_path, create_ngraph_function +from conftest import model_path, create_relu test_net_xml, test_net_bin = model_path() def test_create_IENetwork_from_nGraph(): - func = create_ngraph_function([1, 3, 22, 22]) + func = create_relu([1, 3, 22, 22]) caps = Function.to_capsule(func) cnnNetwork = IENetwork(caps) assert cnnNetwork != None @@ -23,7 +23,7 @@ def test_create_IENetwork_from_nGraph(): def test_get_IENetwork_from_nGraph(): - func = create_ngraph_function([1, 3, 22, 22]) + func = create_relu([1, 3, 22, 22]) caps = Function.to_capsule(func) cnnNetwork = IENetwork(caps) assert cnnNetwork != None diff --git a/inference-engine/samples/benchmark_app/CMakeLists.txt b/inference-engine/samples/benchmark_app/CMakeLists.txt index b37495e5e43..e3412774f27 100644 --- a/inference-engine/samples/benchmark_app/CMakeLists.txt +++ b/inference-engine/samples/benchmark_app/CMakeLists.txt @@ -2,11 +2,46 @@ # SPDX-License-Identifier: Apache-2.0 # +set(TARGET_NAME "benchmark_app") + file (GLOB SRC ${CMAKE_CURRENT_SOURCE_DIR}/*.cpp) file (GLOB HDR ${CMAKE_CURRENT_SOURCE_DIR}/*.hpp) -ie_add_sample(NAME benchmark_app +ie_add_sample(NAME ${TARGET_NAME} SOURCES ${SRC} HEADERS ${HDR} DEPENDENCIES format_reader ie_samples_utils OPENCV_DEPENDENCIES core) + +find_package(OpenCL) + +find_path(OpenCL_HPP_INCLUDE_DIR + NAMES + CL/cl2.hpp OpenCL/cl2.hpp + HINTS + ${opencl_root_hints} + ENV "PROGRAMFILES(X86)" + ENV AMDAPPSDKROOT + ENV INTELOCLSDKROOT + ENV NVSDKCOMPUTE_ROOT + ENV CUDA_PATH + ENV ATISTREAMSDKROOT + ENV 
OCL_ROOT
+  PATH_SUFFIXES
+    include
+    OpenCL/common/inc
+    "AMD APP/include")
+
+if(OPENCL_HEADERS_DIR)
+    # Use OpenCL CPP headers from sources if present
+    set(OpenCL_HEADERS ${OPENCL_HEADERS_DIR})
+elseif(OpenCL_HPP_INCLUDE_DIR)
+    # Append OpenCL CPP headers to C headers and use both
+    set(OpenCL_HEADERS ${OpenCL_INCLUDE_DIR} ${OpenCL_HPP_INCLUDE_DIR})
+endif()
+
+if(OpenCL_FOUND AND OpenCL_HEADERS)
+    target_link_libraries(${TARGET_NAME} PRIVATE OpenCL::OpenCL)
+    target_include_directories(${TARGET_NAME} PRIVATE ${OpenCL_HEADERS})
+    target_compile_definitions(${TARGET_NAME} PRIVATE HAVE_GPU_DEVICE_MEM_SUPPORT)
+endif()
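+
+# If cl2.hpp is not found in the SDK locations searched above, a root hint can
+# be passed at configure time through `opencl_root_hints` (consumed by the
+# find_path() call above); the path below is a placeholder:
+#   cmake -Dopencl_root_hints=/path/to/opencl/sdk <source-dir>
+# HAVE_GPU_DEVICE_MEM_SUPPORT is only defined when both the OpenCL library and
+# its headers are found.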
diff --git a/inference-engine/samples/benchmark_app/benchmark_app.hpp b/inference-engine/samples/benchmark_app/benchmark_app.hpp
index c062cee1960..6395db4ff29 100644
--- a/inference-engine/samples/benchmark_app/benchmark_app.hpp
+++ b/inference-engine/samples/benchmark_app/benchmark_app.hpp
@@ -4,6 +4,10 @@
 #pragma once
 
+#if defined(HAVE_GPU_DEVICE_MEM_SUPPORT)
+#    define HAVE_DEVICE_MEM_SUPPORT
+#endif
+
 #include <string>
 #include <vector>
@@ -132,6 +136,12 @@ static const char progress_message[] =
 // @brief message for performance counters option
 static const char pc_message[] = "Optional. Report performance counters.";
 
+#ifdef HAVE_DEVICE_MEM_SUPPORT
+// @brief message for switching memory allocation type option
+static const char use_device_mem_message[] =
+    "Optional. Switch between host and device memory allocation for input and output buffers.";
+#endif
+
 #ifdef USE_OPENCV
 // @brief message for load config option
 static const char load_config_message[] =
@@ -266,6 +276,11 @@ DEFINE_bool(progress, false, progress_message);
 /// @brief Define flag for showing performance counters
 DEFINE_bool(pc, false, pc_message);
 
+#ifdef HAVE_DEVICE_MEM_SUPPORT
+/// @brief Define flag for switching between host and device memory allocation for input and output buffers
+DEFINE_bool(use_device_mem, false, use_device_mem_message);
+#endif
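+
+// Note: when this flag is compiled in and passed on the command line (e.g.
+// `benchmark_app -m model.xml -d GPU -use_device_mem`, with a placeholder
+// model path), main.cpp routes input filling to gpu::fillRemoteBlobs(), which
+// backs input and output blobs with device-side OpenCL buffers instead of
+// host memory.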
+
 #ifdef USE_OPENCV
 /// @brief Define flag for loading configuration file
 DEFINE_string(load_config, "", load_config_message);
@@ -339,6 +354,9 @@ static void showUsage() {
     std::cout << "    -nthreads \"<integer>\"     " << infer_num_threads_message << std::endl;
     std::cout << "    -enforcebf16=<true/false>     " << enforce_bf16_message << std::endl;
     std::cout << "    -pin \"YES\"/\"HYBRID_AWARE\"/\"NO\"/\"NUMA\"   " << infer_threads_pinning_message << std::endl;
+#ifdef HAVE_DEVICE_MEM_SUPPORT
+    std::cout << "    -use_device_mem           " << use_device_mem_message << std::endl;
+#endif
     std::cout << std::endl << "  Statistics dumping options:" << std::endl;
     std::cout << "    -report_type \"<type>\"     " << report_type_message << std::endl;
     std::cout << "    -report_folder            " << report_folder_message << std::endl;
diff --git a/inference-engine/samples/benchmark_app/infer_request_wrap.hpp b/inference-engine/samples/benchmark_app/infer_request_wrap.hpp
index 5e15f597e7e..dd10a28eb7a 100644
--- a/inference-engine/samples/benchmark_app/infer_request_wrap.hpp
+++ b/inference-engine/samples/benchmark_app/infer_request_wrap.hpp
@@ -65,6 +65,10 @@ public:
         return _request.GetBlob(name);
     }
 
+    void setBlob(const std::string& name, const InferenceEngine::Blob::Ptr& data) {
+        _request.SetBlob(name, data);
+    }
+
     double getExecutionTimeInMilliseconds() const {
         auto execTime = std::chrono::duration_cast<std::chrono::nanoseconds>(_endTime - _startTime);
         return static_cast<double>(execTime.count()) * 0.000001;
diff --git a/inference-engine/samples/benchmark_app/main.cpp b/inference-engine/samples/benchmark_app/main.cpp
index 6c643d45486..9120ce7136e 100644
--- a/inference-engine/samples/benchmark_app/main.cpp
+++ b/inference-engine/samples/benchmark_app/main.cpp
@@ -21,6 +21,7 @@
 #include "infer_request_wrap.hpp"
 #include "inputs_filling.hpp"
 #include "progress_bar.hpp"
+#include "remote_blobs_filling.hpp"
 #include "statistics_report.hpp"
 #include "utils.hpp"
@@ -592,7 +593,16 @@ int main(int argc, char* argv[]) {
         next_step();
 
         InferRequestsQueue inferRequestsQueue(exeNetwork, nireq);
-        fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
+        if (isFlagSetInCommandLine("use_device_mem")) {
+            if (device_name.find("GPU") == 0)
+                ::gpu::fillRemoteBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests, exeNetwork);
+            else if (device_name.find("CPU") == 0)
+                fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
+            else
+                IE_THROW() << "Requested device doesn't support `use_device_mem` option.";
+        } else {
+            fillBlobs(inputFiles, batchSize, app_inputs_info, inferRequestsQueue.requests);
+        }
 
         // ----------------- 10. Measuring performance
         // ------------------------------------------------------------------
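The new `remote_blobs_filling` module introduced below implements this device-side allocation path. Its core pattern — wrap an existing `cl::Buffer` in a remote blob tied to the executable network's GPU context, then hand it to an infer request — reduces to the following sketch. This is a minimal illustration built from the calls that appear in the module; the helper name and the `inputName`/`desc`/`deviceBuffer` parameters are placeholders, not part of the change:

```cpp
#include <gpu/gpu_context_api_ocl.hpp>

void useDeviceBuffer(InferenceEngine::ExecutableNetwork& exeNetwork,
                     InferenceEngine::InferRequest& request,
                     const std::string& inputName,
                     const InferenceEngine::TensorDesc& desc,
                     cl::Buffer& deviceBuffer) {
    // The remote context associates OpenCL memory with the GPU plugin.
    auto context = exeNetwork.GetContext();
    // Wrap the device buffer into a Blob; no host-side copy is made.
    InferenceEngine::Blob::Ptr blob =
        InferenceEngine::gpu::make_shared_blob(desc, context, deviceBuffer);
    request.SetBlob(inputName, blob);
}
```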
diff --git a/inference-engine/samples/benchmark_app/remote_blobs_filling.cpp b/inference-engine/samples/benchmark_app/remote_blobs_filling.cpp
new file mode 100644
index 00000000000..dc6d9fbf34a
--- /dev/null
+++ b/inference-engine/samples/benchmark_app/remote_blobs_filling.cpp
@@ -0,0 +1,140 @@
+// Copyright (C) 2021 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include "remote_blobs_filling.hpp"
+
+#include <memory>
+#include <random>
+#include <string>
+#include <vector>
+
+namespace gpu {
+
+template <typename T>
+using uniformDistribution = typename std::conditional<
+    std::is_floating_point<T>::value,
+    std::uniform_real_distribution<T>,
+    typename std::conditional<std::is_integral<T>::value, std::uniform_int_distribution<T>, void>::type>::type;
+
+template <typename T, typename T2>
+void fillBufferRandom(void* inputBuffer,
+                      size_t elementsNum,
+                      T rand_min = std::numeric_limits<T>::min(),
+                      T rand_max = std::numeric_limits<T>::max()) {
+    std::mt19937 gen(0);
+    uniformDistribution<T2> distribution(rand_min, rand_max);
+    auto inputBufferData = static_cast<T*>(inputBuffer);
+    for (size_t i = 0; i < elementsNum; i++) {
+        inputBufferData[i] = static_cast<T>(distribution(gen));
+    }
+}
+
+void fillBuffer(void* inputBuffer, size_t elementsNum, InferenceEngine::Precision precision) {
+    if (precision == InferenceEngine::Precision::FP32) {
+        fillBufferRandom<float, float>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::FP16) {
+        fillBufferRandom<short, short>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::I32) {
+        fillBufferRandom<int32_t, int32_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::I64) {
+        fillBufferRandom<int64_t, int64_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::U8) {
+        // uniform_int_distribution<uint8_t> is not allowed in the C++17
+        // standard and vs2017/19
+        fillBufferRandom<uint8_t, uint32_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::I8) {
+        // uniform_int_distribution<int8_t> is not allowed in the C++17 standard
+        // and vs2017/19
+        fillBufferRandom<int8_t, int32_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::U16) {
+        fillBufferRandom<uint16_t, uint16_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::I16) {
+        fillBufferRandom<int16_t, int16_t>(inputBuffer, elementsNum);
+    } else if (precision == InferenceEngine::Precision::BOOL) {
+        fillBufferRandom<uint8_t, uint32_t>(inputBuffer, elementsNum, 0, 1);
+    } else {
+        IE_THROW() << "Requested precision is not supported";
+    }
+}
+
+size_t getBytesPerElement(InferenceEngine::Precision precision) {
+    switch (precision) {
+    case InferenceEngine::Precision::FP32:
+        return 4;
+    case InferenceEngine::Precision::FP16:
+        return 2;
+    case InferenceEngine::Precision::I32:
+        return 4;
+    case InferenceEngine::Precision::I64:
+        return 8;
+    case InferenceEngine::Precision::U8:
+        return 1;
+    case InferenceEngine::Precision::I8:
+        return 1;
+    case InferenceEngine::Precision::U16:
+        return 2;
+    case InferenceEngine::Precision::I16:
+        return 2;
+    case InferenceEngine::Precision::BOOL:
+        return 1;
+    default:
+        IE_THROW() << "Requested precision is not supported";
+    }
+}
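+
+// fillRemoteBlobs (below): for every infer request, (1) allocate one
+// CL_MEM_READ_WRITE cl::Buffer per input/output, (2) for inputs, map the
+// buffer into host address space, fill it with random data via fillBuffer()
+// and unmap it again, then (3) wrap the buffer into a remote blob bound to
+// the executable network's GPU context and hand it over with setBlob().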
+void fillRemoteBlobs(const std::vector<std::string>& inputFiles,
+                     const size_t& batchSize,
+                     benchmark_app::InputsInfo& app_inputs_info,
+                     std::vector<InferReqWrap::Ptr> requests,
+                     const InferenceEngine::ExecutableNetwork& exeNetwork) {
+#ifdef HAVE_DEVICE_MEM_SUPPORT
+    slog::info << "Device memory will be used for input and output blobs" << slog::endl;
+    if (inputFiles.size()) {
+        slog::warn << "Device memory supports only random data at this moment, input images will be ignored"
+                   << slog::endl;
+    }
+
+    auto context = exeNetwork.GetContext();
+    auto oclContext = std::dynamic_pointer_cast<InferenceEngine::gpu::ClContext>(context)->get();
+    auto oclInstance = std::make_shared<OpenCL>(oclContext);
+
+    auto setShared = [&](size_t requestId,
+                         const std::string name,
+                         const InferenceEngine::TensorDesc& desc,
+                         bool fillRandom = false) {
+        cl_int err;
+        auto inputDims = desc.getDims();
+        auto elementsNum = std::accumulate(begin(inputDims), end(inputDims), 1, std::multiplies<size_t>());
+        auto inputSize = elementsNum * getBytesPerElement(desc.getPrecision());
+
+        cl::Buffer sharedBuffer =
+            cl::Buffer(oclInstance->_context, CL_MEM_READ_WRITE, (cl::size_type)inputSize, NULL, &err);
+
+        if (fillRandom) {
+            void* mappedPtr = oclInstance->_queue.enqueueMapBuffer(sharedBuffer,
+                                                                   CL_TRUE,
+                                                                   CL_MEM_READ_WRITE,
+                                                                   0,
+                                                                   (cl::size_type)inputSize);
+            fillBuffer(mappedPtr, elementsNum, desc.getPrecision());
+            oclInstance->_queue.enqueueUnmapMemObject(sharedBuffer, mappedPtr);
+        }
+
+        InferenceEngine::Blob::Ptr sharedBlob = InferenceEngine::gpu::make_shared_blob(desc, context, sharedBuffer);
+
+        requests.at(requestId)->setBlob(name, sharedBlob);
+    };
+
+    for (size_t requestId = 0; requestId < requests.size(); requestId++) {
+        for (auto& item : exeNetwork.GetInputsInfo())
+            setShared(requestId, item.first, item.second->getTensorDesc(), true);
+
+        for (auto& item : exeNetwork.GetOutputsInfo())
+            setShared(requestId, item.first, item.second->getTensorDesc());
+    }
+#else
+    IE_THROW() << "Device memory requested for GPU device, but OpenCL was not linked";
+#endif
+}
+
+}  // namespace gpu
diff --git a/inference-engine/samples/benchmark_app/remote_blobs_filling.hpp b/inference-engine/samples/benchmark_app/remote_blobs_filling.hpp
new file mode 100644
index 00000000000..66e2b1b2c66
--- /dev/null
+++ b/inference-engine/samples/benchmark_app/remote_blobs_filling.hpp
@@ -0,0 +1,64 @@
+// Copyright (C) 2021 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#if defined(HAVE_GPU_DEVICE_MEM_SUPPORT)
+#    define HAVE_DEVICE_MEM_SUPPORT
+#    include <gpu/gpu_context_api_ocl.hpp>
+#endif
+
+#include <string>
+
+#include "infer_request_wrap.hpp"
+#include "utils.hpp"
+
+namespace gpu {
+
+#ifdef HAVE_DEVICE_MEM_SUPPORT
+struct OpenCL {
+    cl::Context _context;
+    cl::Device _device;
+    cl::CommandQueue _queue;
+
+    explicit OpenCL(std::shared_ptr<std::vector<cl_context_properties>> media_api_context_properties = nullptr) {
+        // get Intel GPU OCL device, create context and queue
+        {
+            std::vector<cl::Device> devices;
+            std::vector<cl::Platform> platforms;
+            const unsigned int refVendorID = 0x8086;
+
+            cl::Platform::get(&platforms);
+            for (auto& p : platforms) {
+                p.getDevices(CL_DEVICE_TYPE_GPU, &devices);
+                for (auto& d : devices) {
+                    if (refVendorID == d.getInfo<CL_DEVICE_VENDOR_ID>()) {
+                        _device = d;
+                        _context = cl::Context(_device);
+                        break;
+                    }
+                }
+            }
+
+            cl_command_queue_properties props = CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE;
+            _queue = cl::CommandQueue(_context, _device, props);
+        }
+    }
+
+    explicit OpenCL(cl_context context) {
+        // user-supplied context handle
+        _context = cl::Context(context, true);
+        _device = cl::Device(_context.getInfo<CL_CONTEXT_DEVICES>()[0].get(), true);
+
+        cl_command_queue_properties props = CL_QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE;
+        _queue = cl::CommandQueue(_context, _device, props);
+    }
+};
+#endif
+
+void fillRemoteBlobs(const std::vector<std::string>& inputFiles,
+                     const size_t& batchSize,
+                     benchmark_app::InputsInfo& app_inputs_info,
+                     std::vector<InferReqWrap::Ptr> requests,
+                     const InferenceEngine::ExecutableNetwork& exeNetwork);
+
+}  // namespace gpu
diff --git a/inference-engine/scripts/dependencies.bat
b/inference-engine/scripts/dependencies.bat deleted file mode 100644 index 5241d428d18..00000000000 --- a/inference-engine/scripts/dependencies.bat +++ /dev/null @@ -1,96 +0,0 @@ -@echo off - -:: Copyright (C) 2018-2021 Intel Corporation -:: SPDX-License-Identifier: Apache-2.0 - -setlocal enabledelayedexpansion - -for /f "delims=" %%x in (dependencies_64.txt) do (set "%%x") - -for %%A in ("%MKL%") do set MKL_FILENAME=%%~nxA -for %%A in ("%OMP%") do set OMP_FILENAME=%%~nxA -for %%A in ("%MYRIAD%") do set MYRIAD_FILENAME=%%~nxA -for %%A in ("%GNA%") do set GNA_FILENAME=%%~nxA -for %%A in ("%OPENCV%") do set OPENCV_FILENAME=%%~nxA -for %%A in ("%HDDL%") do set HDDL_FILENAME=%%~nxA -for %%A in ("%VPU_FIRMWARE_MA2X8X%") do set VPU_FIRMWARE_MA2X8X_FILENAME=%%~nxA -for %%A in ("%TBB%") do set TBB_FILENAME=%%~nxA - -call :DownloadFile MKL %MKL% -call :DownloadFile OMP %OMP% -call :DownloadFile MYRIAD %MYRIAD% -call :DownloadFile GNA %GNA% -call :DownloadFile OPENCV %OPENCV% -call :DownloadFile HDDL %HDDL% -call :DownloadFile VPU_FIRMWARE_MA2X8X %VPU_FIRMWARE_MA2X8X% -call :DownloadFile TBB %TBB% - -for /f "delims=" %%x in (ld_library_rpath_64.txt) do (set "%%x") - -set PATH=%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%;%PATH% -set PATH=%DL_SDK_TEMP%\test_dependencies\MKL\%MKL_FILENAME%%MKL%;%PATH% -set PATH=%DL_SDK_TEMP%\test_dependencies\OMP\%OMP_FILENAME%%OMP%;%PATH% -set PATH=%DL_SDK_TEMP%\test_dependencies\GNA\%GNA_FILENAME%%GNA%;%PATH% -set PATH=%DL_SDK_TEMP%\test_dependencies\OPENCV\%OPENCV_FILENAME%%OPENCV%;%PATH% -set PATH=%DL_SDK_TEMP%\test_dependencies\TBB\%TBB_FILENAME%%TBB%;%PATH% - -set PATH=%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%;%PATH% - -if not "%MYRIAD%"=="" ( - if exist "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%\mvnc" ( - echo xcopy.exe "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%" intel64 /S /I /Y /R - xcopy.exe "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%" intel64 /S /I /Y /R - ) - - if exist "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%\..\bin\mvnc" ( - echo xcopy.exe "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%\..\bin\*" intel64 /S /I /Y /R - xcopy.exe "%DL_SDK_TEMP%\test_dependencies\MYRIAD\%MYRIAD_FILENAME%%MYRIAD%\..\bin\*" intel64 /S /I /Y /R - ) -) - -if not "%VPU_FIRMWARE_MA2X8X%"=="" ( - if exist "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%" ( - echo xcopy.exe "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%\*" intel64 /S /I /Y /R - xcopy.exe "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%\*" intel64 /S /I /Y /R - ) -) - -set PATH=%DL_SDK_TEMP%\test_dependencies\HDDL\%HDDL_FILENAME%%HDDL%\..\bin;%PATH% - -if not "%HDDL%"=="" ( - set HDDL_INSTALL_DIR=%DL_SDK_TEMP%\test_dependencies\HDDL\%HDDL_FILENAME%%HDDL%\.. 
- if exist "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%" ( - echo xcopy.exe "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%\*" %HDDL_INSTALL_DIR%\lib /S /I /Y /R - xcopy.exe "%DL_SDK_TEMP%\test_dependencies\VPU\%VPU_FIRMWARE_MA2X8X_FILENAME%\*" "%HDDL_INSTALL_DIR%\lib" /S /I /Y /R - ) -) - -echo PATH=%PATH% - -endlocal & set PATH=%PATH% - -exit /B %ERRORLEVEL% - -:DownloadFile -set DEPENDENCY=%~1 -set DEPENDENCY_URL=%~2 -set DEPENDENCY_FILE=%~nx2 -set DEPENDENCY_EXT=%~x2 - -if not "%DEPENDENCY_URL%"=="" ( - if not exist "%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\%DEPENDENCY_FILE%" ( - mkdir "%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\%DEPENDENCY_FILE%" - for /L %%a in (1,1,10) do ( - powershell -command "[Net.ServicePointManager]::SecurityProtocol = [Net.SecurityProtocolType]::Tls12; iwr -outf '%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\_%DEPENDENCY_FILE%' %DEPENDENCY_URL%" - call "C:\Program Files\7-Zip\7z.exe" x -y %DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\_%DEPENDENCY_FILE% -o%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\%DEPENDENCY_FILE% - if !ERRORLEVEL! equ 0 goto :DownloadFileContinue - timeout /T 15 - ) - ) -) -goto:eof - -:DownloadFileContinue -if "%DEPENDENCY_EXT%" == ".txz" call "C:\Program Files\7-Zip\7z.exe" x -y %DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\%DEPENDENCY_FILE%\_%DEPENDENCY_FILE:txz=tar% -o%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\%DEPENDENCY_FILE% -del "%DL_SDK_TEMP%\test_dependencies\%DEPENDENCY%\_%DEPENDENCY_FILE%" /F /Q -goto:eof diff --git a/inference-engine/scripts/dependencies.sh b/inference-engine/scripts/dependencies.sh deleted file mode 100755 index 640ed7e9947..00000000000 --- a/inference-engine/scripts/dependencies.sh +++ /dev/null @@ -1,68 +0,0 @@ -#!/bin/bash - -# Copyright (C) 2018-2021 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -if [ "$1" = "" ]; then - dep_arch=64 - else - dep_arch=$1 -fi - -item_path="" -add_path() { - component=$1 - item_path="" - echo "Read file: dependencies_${dep_arch}.txt" - grep_component="\b${component}\b" - - if [[ $(grep -m 1 "$grep_component" "dependencies_${dep_arch}.txt") ]];then - archive_path=$(grep -m 1 "$grep_component" "dependencies_${dep_arch}.txt" | sed -E "s/${component}=//g") - library_rpath=$(grep -m 1 "$grep_component" "ld_library_rpath_${dep_arch}.txt" | sed -E "s/${component}=//g") - filename=$(basename "$archive_path") - if [[ (! -d "$DL_SDK_TEMP/test_dependencies/$component/$filename") || - (-d "$DL_SDK_TEMP/test_dependencies/$component/$filename" && - ! 
$(ls -A "$DL_SDK_TEMP/test_dependencies/$component/$filename")) ]]; then - mkdir -p "$DL_SDK_TEMP/test_dependencies/$component/$filename" - wget -q "$archive_path" -O "$DL_SDK_TEMP/test_dependencies/$filename" - if [[ $filename == *.zip ]]; then - unzip "$DL_SDK_TEMP/test_dependencies/$filename" -d "$DL_SDK_TEMP/test_dependencies/$component/$filename" - elif [[ $filename == *.7z ]]; then - 7za x -y "$DL_SDK_TEMP/test_dependencies/$filename" -o "$DL_SDK_TEMP/test_dependencies/$component/$filename" - else - tar xf "$DL_SDK_TEMP/test_dependencies/$filename" -C "$DL_SDK_TEMP/test_dependencies/$component/$filename" - fi - rm "$DL_SDK_TEMP/test_dependencies/$filename" - fi - item_path=$component/$filename/$library_rpath - fi -} - -runtimes=(MKL CLDNN MYRIAD GNA DLIA OPENCV VPU_FIRMWARE_USB-MA2X8X HDDL OMP TBB AOCL_RTE LIBUSB) - -export_library_path() { - export LD_LIBRARY_PATH=$DL_SDK_TEMP/test_dependencies/$1:$LD_LIBRARY_PATH -} - -export_env_variable() { - export "$2"="$DL_SDK_TEMP/test_dependencies/$1" -} - -ma2480_path="" -for i in "${runtimes[@]}" -do - add_path "$i" - export_library_path "$item_path" - if [ "$i" == "VPU_FIRMWARE_USB-MA2X8X" ] - then - ma2480_path="$item_path" - fi - if [ "$i" == "HDDL" ] - then - cp -r "$DL_SDK_TEMP/test_dependencies/$ma2480_path/"* "$DL_SDK_TEMP/test_dependencies/$item_path" - export HDDL_INSTALL_DIR="$DL_SDK_TEMP/test_dependencies/$item_path/.." - fi -done - -echo DATA_PATH="$DATA_PATH" -export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:lib:/usr/local/lib \ No newline at end of file diff --git a/inference-engine/src/CMakeLists.txt b/inference-engine/src/CMakeLists.txt index ceb077de7a7..8b198bfbf28 100644 --- a/inference-engine/src/CMakeLists.txt +++ b/inference-engine/src/CMakeLists.txt @@ -47,9 +47,8 @@ add_subdirectory(snippets) add_custom_target(ie_libraries ALL DEPENDS inference_engine_transformations inference_engine_legacy inference_engine inference_engine_preproc - inference_engine_ir_v7_reader inference_engine_ir_reader - inference_engine_lp_transformations inference_engine_snippets - ir_frontend) + inference_engine_ir_v7_reader ir_ngraph_frontend + inference_engine_lp_transformations inference_engine_snippets) if(NGRAPH_ONNX_FRONTEND_ENABLE) add_dependencies(ie_libraries onnx_ngraph_frontend) diff --git a/inference-engine/src/cldnn_engine/cldnn_config.cpp b/inference-engine/src/cldnn_engine/cldnn_config.cpp index 28aa8063e47..533e32271bd 100644 --- a/inference-engine/src/cldnn_engine/cldnn_config.cpp +++ b/inference-engine/src/cldnn_engine/cldnn_config.cpp @@ -28,7 +28,7 @@ namespace CLDNNPlugin { static void createDirectory(std::string _path) { #if defined(ENABLE_UNICODE_PATH_SUPPORT) && defined(_WIN32) - std::wstring widepath = FileUtils::multiByteCharToWString(_path.c_str()); + std::wstring widepath = ov::util::string_to_wstring(_path.c_str()); const wchar_t* path = widepath.c_str(); #else const char* path = _path.c_str(); diff --git a/inference-engine/src/cldnn_engine/cldnn_graph.cpp b/inference-engine/src/cldnn_engine/cldnn_graph.cpp index 75ea9d2a251..49d5212d37e 100644 --- a/inference-engine/src/cldnn_engine/cldnn_graph.cpp +++ b/inference-engine/src/cldnn_engine/cldnn_graph.cpp @@ -60,8 +60,6 @@ CLDNNGraph::CLDNNGraph(std::shared_ptr graph, uint16_t stream_id) void CLDNNGraph::UpdateLayersMaps() { OV_ITT_SCOPED_TASK(itt::domains::CLDNNPlugin, "CLDNNGraph::UpdateLayersMaps"); primitiveIDs = m_program->primitiveIDs; - primitivesToIRLayersMap = m_program->primitivesToIRLayersMap; - IRToNgraphLayersMap = m_program->IRToNgraphLayersMap; 
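// The two map copies removed above duplicated bookkeeping that the plugin now
// derives from a single query, GetNetwork()->get_ext_id_mapping(), as the
// find_origin_layers() rewrite further down in this hunk shows. A minimal
// compilable sketch of that lookup (a plain std::map stands in for the real
// mapping; the names here are illustrative):
#include <map>
#include <string>
#include <vector>

std::vector<std::string> find_origin_layers(const std::map<std::string, std::string>& extIdMap,
                                            const std::string& prim_id) {
    auto it = extIdMap.find(prim_id);
    if (it == extIdMap.end())
        return {};            // primitive added by the plugin itself, no IR origin
    return {it->second};      // the single originating graph layer
}

int main() {
    std::map<std::string, std::string> extIdMap{{"convolution:conv1", "conv1"}};
    return find_origin_layers(extIdMap, "convolution:conv1").size() == 1 ? 0 : 1;
}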
prevPrimitiveIDs = m_program->prevPrimitiveIDs; profilingIDs = m_program->profilingIDs; perfMap = m_program->perfMap; @@ -219,25 +217,6 @@ std::shared_ptr CLDNNGraph::GetExecGraphInfoByPrimitivesInfo(s return res; }; - auto split_string = [](std::string src, std::string delimiter = ",") -> std::vector { - std::vector tokens; - std::string tokenBuf; - size_t prev = 0, pos = 0, srcLength = src.length(), delimLength = delimiter.length(); - do { - pos = src.find(delimiter, prev); - if (pos == std::string::npos) { - pos = srcLength; - } - tokenBuf = src.substr(prev, pos - prev); - if (!tokenBuf.empty()) { - tokens.push_back(tokenBuf); - } - prev = pos + delimLength; - } while (pos < srcLength && prev < srcLength); - - return tokens; - }; - auto remove_type_from_name = [](const std::string& name) -> std::string { auto it = std::find(name.begin(), name.end(), ':'); if (it == name.end() || (it + 1) == name.end()) @@ -246,22 +225,13 @@ std::shared_ptr CLDNNGraph::GetExecGraphInfoByPrimitivesInfo(s return std::string((it+1), name.end()); }; + auto extIdMap = GetNetwork()->get_ext_id_mapping(); + auto find_origin_layers = [&](const std::string& name) -> std::vector { - if (primitivesToIRLayersMap.find(name) == primitivesToIRLayersMap.end()) + if (extIdMap.find(name) == extIdMap.end()) { return {}; - - auto cnn_names = primitivesToIRLayersMap.at(name); - std::vector res; - - for (auto& cnn_name : cnn_names) { - if (IRToNgraphLayersMap.find(cnn_name) != IRToNgraphLayersMap.end()) { - auto ngraph_names = split_string(IRToNgraphLayersMap.at(cnn_name)); - res.insert(res.end(), ngraph_names.begin(), ngraph_names.end()); - } else { - res.push_back(cnn_name); - } } - return res; + return { extIdMap.at(name) }; }; auto get_inputs = [&] (const cldnn::primitive_info& prim_info) { @@ -599,13 +569,21 @@ std::map CLDNNGraph::G auto allIds = GetNetwork()->get_all_primitive_org_ids(); auto executedPrimitives = GetNetwork()->get_executed_primitives(); auto primitivesInfo = GetNetwork()->get_primitives_info(); + auto extIdMap = GetNetwork()->get_ext_id_mapping(); - auto getUpperCaseName = [&](std::string name) { + auto getUpperCaseName = [](std::string name) { if (name.length() > 0) name[0] = toupper(name[0]); return name; }; + auto getClearName = [](std::string name) { + if (name.find(":") != std::string::npos) { + name = name.substr(name.find(":") + 1, name.length()); + } + return name; + }; + auto getFromProfiling = [&](std::string primId) -> bool { auto perfIter = perfMap.find(primId); @@ -696,10 +674,7 @@ std::map CLDNNGraph::G } } - std::string layerName = primId; - if (primId.find(":") != std::string::npos) { - layerName = primId.substr(primId.find(":") + 1, primId.length()); - } + std::string layerName = getClearName(primId); for (auto& pi : primitivesInfo) { if (pi.original_id == primId) { @@ -735,10 +710,27 @@ std::map CLDNNGraph::G } // Step 3. 
Checking primitives which has been deleted from execution order but added by clDNNPlugin - for (auto& primId : profilingIDs) + for (auto& primId : profilingIDs) { if (std::find(allIds.begin(), allIds.end(), primId) == allIds.end()) { getFromProfiling(primId); } + } + + for (auto& p : extIdMap) { + if (p.first.find(p.second) != std::string::npos) { + continue; + } + auto first_res = result.find(getClearName(p.first)); + auto second_res = result.find(getClearName(p.second)); + + if (first_res != result.end() && second_res != result.end() && first_res != second_res) { + std::swap(first_res->second.cpu_uSec, second_res->second.cpu_uSec); + std::swap(first_res->second.realTime_uSec, second_res->second.realTime_uSec); + std::swap(first_res->second.status, second_res->second.status); + std::swap(first_res->second.exec_type, second_res->second.exec_type); + std::swap(first_res->second.execution_index, second_res->second.execution_index); + } + } return result; } diff --git a/inference-engine/src/cldnn_engine/cldnn_graph.h b/inference-engine/src/cldnn_engine/cldnn_graph.h index 206c58aaccd..d220c4009f5 100644 --- a/inference-engine/src/cldnn_engine/cldnn_graph.h +++ b/inference-engine/src/cldnn_engine/cldnn_graph.h @@ -61,8 +61,6 @@ protected: InferenceEngine::gpu::ClContext::Ptr m_context; std::vector> m_networks; std::map primitiveIDs; - std::map> primitivesToIRLayersMap; - std::map IRToNgraphLayersMap; std::map> prevPrimitiveIDs; std::map> perfMap; diff --git a/inference-engine/src/cldnn_engine/cldnn_infer_request.cpp b/inference-engine/src/cldnn_engine/cldnn_infer_request.cpp index 9a55217975c..6c0e2527eac 100644 --- a/inference-engine/src/cldnn_engine/cldnn_infer_request.cpp +++ b/inference-engine/src/cldnn_engine/cldnn_infer_request.cpp @@ -12,6 +12,7 @@ #include "cldnn_remote_context.h" #include "cldnn_executable_network.h" #include "cldnn_itt.h" +#include "cldnn/runtime/debug_configuration.hpp" #include #include @@ -622,6 +623,10 @@ void CLDNNInferRequest::allocate_inputs() { IE_THROW() << "Input layout for " << name << " is not found"; } + GPU_DEBUG_GET_INSTANCE(debug_config); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << name << ": input blob]" << std::endl; + } if (desc.getPrecision() == Precision::I16 || desc.getPrecision() == Precision::U16) { TensorDesc desc_fp32 = desc; desc_fp32.setPrecision(Precision::FP32); @@ -673,6 +678,10 @@ void CLDNNInferRequest::allocate_outputs() { const cldnn::layout output_layout = m_graph->GetNetwork()->get_output_memory(outputID)->get_layout(); const TensorDesc& desc = no.second->getTensorDesc(); + GPU_DEBUG_GET_INSTANCE(debug_config); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << no.first << ": output blob]" << std::endl; + } auto blobPtr = create_device_blob(desc, output_layout); _deviceOutputs[no.first] = blobPtr; _outputs[no.first] = blobPtr; diff --git a/inference-engine/src/cldnn_engine/cldnn_program.cpp b/inference-engine/src/cldnn_engine/cldnn_program.cpp index 7386501f0b1..22a55d743bd 100644 --- a/inference-engine/src/cldnn_engine/cldnn_program.cpp +++ b/inference-engine/src/cldnn_engine/cldnn_program.cpp @@ -284,14 +284,12 @@ std::vector Program::GetInputPrimitiveIDs(const std::shared void Program::AddPrimitiveToProfiler(const std::shared_ptr& op, cldnn::primitive_id customOutputId) { auto id = layer_type_name_ID(op); - primitivesToIRLayersMap[id] = { op->get_friendly_name() }; primitiveIDs[id] = customOutputId.empty() ? 
id : customOutputId;
     profilingIDs.push_back(id);
 }
 
 void Program::AddPrimitiveToProfiler(cldnn::primitive_id id, const std::shared_ptr<ngraph::Node>& op,
                                      cldnn::primitive_id customOutputId) {
-    primitivesToIRLayersMap[id] = { op->get_friendly_name() };
     primitiveIDs[id] = customOutputId.empty() ? id : customOutputId;
     profilingIDs.push_back(id);
 }
@@ -299,7 +297,6 @@ void Program::AddPrimitiveToProfiler(cldnn::primitive_id id, const std::shared_p
 void Program::AddInnerPrimitiveToProfiler(cldnn::primitive_id id, cldnn::primitive_id parentId,
                                           const std::shared_ptr<ngraph::Node>& op) {
     InitProfileInfo(id, layer_type_lower(op), false, InferenceEngine::InferenceEngineProfileInfo::EXECUTED, parentId);
-    primitivesToIRLayersMap[id] = { op->get_friendly_name() };
     primitiveIDs[id] = id;
     profilingIDs.push_back(id);
 }
@@ -328,28 +325,24 @@ void Program::InitProfileInfo(const std::string& layerName,
 // TODO: Does it make sense to add such method to ngraph core?
 bool IsNodeOnConstPath(const std::shared_ptr<ngraph::Node>& node) {
-    std::list<std::shared_ptr<ngraph::Node>> nodes_to_process = { node };
-    while (!nodes_to_process.empty()) {
-        auto current_node = nodes_to_process.front();
-        nodes_to_process.pop_front();
-
-        for (size_t i = 0; i < current_node->get_input_size(); i++) {
-            auto input_node = current_node->get_input_node_shared_ptr(i);
-
-            // If input is constant, then drop if from the processing list
-            if (std::dynamic_pointer_cast<ngraph::op::Constant>(input_node) != nullptr)
-                continue;
-
-            // If the node doesn't have any parents and it's not a constant, then we deal with dynamic path
-            if (input_node->get_input_size() == 0) {
+    std::set<std::shared_ptr<ngraph::Node>> nodes_processed = {};
+    std::function<bool(const std::shared_ptr<ngraph::Node>&)> is_const_node = [&nodes_processed, &is_const_node](const std::shared_ptr<ngraph::Node>& node) {
+        if (nodes_processed.count(node)) return true;
+        nodes_processed.insert(node);
+        // If input is constant, then drop if from the processing list
+        if (std::dynamic_pointer_cast<ngraph::op::Constant>(node) != nullptr)
+            return true;
+        // If the node doesn't have any parents and it's not a constant, then we deal with dynamic path
+        if (node->get_input_size() == 0)
+            return false;
+        for (size_t i = 0; i < node->get_input_size(); i++) {
+            auto input_node = node->get_input_node_shared_ptr(i);
+            if (!is_const_node(input_node))
                 return false;
-            }
-
-            nodes_to_process.insert(nodes_to_process.end(), input_node);
         }
-    }
-
-    return true;
+        return true;
+    };
+    return is_const_node(node);
 }
 } // namespace CLDNNPlugin
diff --git a/inference-engine/src/cldnn_engine/cldnn_program.h b/inference-engine/src/cldnn_engine/cldnn_program.h index 23b6313cac9..f499104a9b9 100644 --- a/inference-engine/src/cldnn_engine/cldnn_program.h +++ b/inference-engine/src/cldnn_engine/cldnn_program.h @@ -76,8 +76,6 @@ public:
     static const cldnn::primitive_id m_postCustomLayerTag;
 
     std::map<std::string, cldnn::primitive_id> primitiveIDs;
-    std::map<std::string, std::vector<std::string>> primitivesToIRLayersMap;
-    std::map<std::string, std::string> IRToNgraphLayersMap;
     std::map<std::string, std::vector<cldnn::primitive_id>> prevPrimitiveIDs;
     std::map<cldnn::primitive_id, std::pair<std::string, PerfCounter>> perfMap;
diff --git a/inference-engine/src/cldnn_engine/ops/batch_to_space.cpp b/inference-engine/src/cldnn_engine/ops/batch_to_space.cpp index e46643f0617..d67f9e9888a 100644 --- a/inference-engine/src/cldnn_engine/ops/batch_to_space.cpp +++ b/inference-engine/src/cldnn_engine/ops/batch_to_space.cpp @@ -42,7 +42,8 @@ void CreateBatchToSpaceOp(Program& p, const std::shared_ptrget_friendly_name());
     p.AddPrimitive(batchToSpacePrim);
     p.AddPrimitiveToProfiler(op);
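The IsNodeOnConstPath() rewrite above trades the iterative worklist for a memoized recursive walk: a subgraph that feeds several inputs is visited once instead of once per use, and the visited set also keeps the traversal from looping. A standalone sketch of the same traversal over a toy node type (Node and is_on_const_path are illustrative, not the plugin's API):

    #include <functional>
    #include <iostream>
    #include <memory>
    #include <set>
    #include <vector>

    struct Node {
        bool is_constant = false;
        std::vector<std::shared_ptr<Node>> inputs;
    };

    // True when every path upward from `node` terminates in a constant.
    bool is_on_const_path(const std::shared_ptr<Node>& node) {
        std::set<std::shared_ptr<Node>> processed;
        std::function<bool(const std::shared_ptr<Node>&)> is_const =
            [&](const std::shared_ptr<Node>& n) -> bool {
                if (processed.count(n))
                    return true;          // already visited on this walk
                processed.insert(n);
                if (n->is_constant)
                    return true;
                if (n->inputs.empty())
                    return false;         // non-constant source: dynamic path
                for (auto& in : n->inputs)
                    if (!is_const(in))
                        return false;
                return true;
            };
        return is_const(node);
    }

    int main() {
        auto c = std::make_shared<Node>(Node{true, {}});
        auto mul = std::make_shared<Node>(Node{false, {c, c}});  // `c` is shared; visited once
        std::cout << std::boolalpha << is_on_const_path(mul) << "\n";  // prints: true
    }

Marking a node as processed before recursing means any non-const discovery still aborts the whole walk with false, so a memoized "true" can only ever be returned for nodes that were, or are being, proven constant.
diff --git a/inference-engine/src/cldnn_engine/ops/broadcast.cpp b/inference-engine/src/cldnn_engine/ops/broadcast.cpp index 6d6e6303200..16264a31fea 100644 --- a/inference-engine/src/cldnn_engine/ops/broadcast.cpp +++ 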
b/inference-engine/src/cldnn_engine/ops/broadcast.cpp @@ -31,8 +31,13 @@ static void CreateCommonBroadcastOp(Program& p, const std::shared_ptrget_input_element_type(0)); - auto reorderPrim = cldnn::reorder(reorderName, inputPrimitive, targetFormat, targetDatatype); - + auto reorderPrim = cldnn::reorder(reorderName, + inputPrimitive, + targetFormat, + targetDatatype, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(reorderPrim); p.AddInnerPrimitiveToProfiler(reorderName, layerName, op); @@ -66,7 +71,7 @@ static void CreateCommonBroadcastOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(reshapePrim); p.AddInnerPrimitiveToProfiler(reshapeName, layerName, op); @@ -75,7 +80,9 @@ static void CreateCommonBroadcastOp(Program& p, const std::shared_ptrget_output_shape(0))); + CldnnTensorFromIEDims(op->get_output_shape(0)), + {}, + op->get_friendly_name()); p.AddPrimitive(broadcastPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/concat.cpp b/inference-engine/src/cldnn_engine/ops/concat.cpp index 453e9996530..fc1e51d1981 100644 --- a/inference-engine/src/cldnn_engine/ops/concat.cpp +++ b/inference-engine/src/cldnn_engine/ops/concat.cpp @@ -45,7 +45,8 @@ void CreateConcatOp(Program& p, const std::shared_ptr& o layerName, inputPrimitives, GetConcatAxis(op->get_axis(), op->get_input_shape(0).size()), - DataTypeFromPrecision(op->get_output_element_type(0))); + DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name()); p.AddPrimitive(concatPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/constant.cpp b/inference-engine/src/cldnn_engine/ops/constant.cpp index fea42f31d98..58bc0a18d4a 100644 --- a/inference-engine/src/cldnn_engine/ops/constant.cpp +++ b/inference-engine/src/cldnn_engine/ops/constant.cpp @@ -18,6 +18,7 @@ #include "ngraph/op/util/op_types.hpp" #include "cldnn/primitives/data.hpp" +#include "cldnn/runtime/debug_configuration.hpp" namespace CLDNNPlugin { @@ -169,6 +170,10 @@ void CreateConstantOp(Program& p, const std::shared_ptrsecond; } else { + GPU_DEBUG_GET_INSTANCE(debug_config); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << initialconstPrimID << ": constant]" << std::endl; + } cldnn::memory::ptr mem = p.GetEngine().allocate_memory(constLayout, false); auto& stream = p.GetEngine().get_program_stream(); cldnn::mem_lock lock{mem, stream}; @@ -199,7 +204,7 @@ void CreateConstantOp(Program& p, const std::shared_ptrget_friendly_name())); p.blobMemCache[std::make_pair(data, constDims)] = initialconstPrimID; constPrimID = initialconstPrimID; } diff --git a/inference-engine/src/cldnn_engine/ops/convert.cpp b/inference-engine/src/cldnn_engine/ops/convert.cpp index 6af5bee759d..603eb26abeb 100644 --- a/inference-engine/src/cldnn_engine/ops/convert.cpp +++ b/inference-engine/src/cldnn_engine/ops/convert.cpp @@ -19,8 +19,13 @@ void CreateConvertLikeOp(Program& p, const std::shared_ptrget_input_element_type(1)); - auto reorderPrim = cldnn::reorder(layerName, inputPrimitives[0], cldnn::format::any, outDataType); - + auto reorderPrim = cldnn::reorder(layerName, + inputPrimitives[0], + cldnn::format::any, + outDataType, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(reorderPrim); p.AddPrimitiveToProfiler(op); } @@ -32,7 +37,13 @@ void CreateConvertOp(Program& p, const std::shared_ptr& auto outDataType = DataTypeFromPrecision(op->get_destination_type()); - 
auto reorderPrim = cldnn::reorder(layerName, inputPrimitives[0], cldnn::format::any, outDataType); + auto reorderPrim = cldnn::reorder(layerName, + inputPrimitives[0], + cldnn::format::any, + outDataType, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(reorderPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/convolution.cpp b/inference-engine/src/cldnn_engine/ops/convolution.cpp index 83f536a68b7..e8c44693dbd 100644 --- a/inference-engine/src/cldnn_engine/ops/convolution.cpp +++ b/inference-engine/src/cldnn_engine/ops/convolution.cpp @@ -84,7 +84,8 @@ void CreateGroupConvolutionOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(convPrim); p.AddPrimitiveToProfiler(op); @@ -112,7 +113,8 @@ void CreateConvolutionOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(convPrim); p.AddPrimitiveToProfiler(op); @@ -146,7 +148,8 @@ void CreateConvolutionBackpropDataOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(permutePrim); p.AddInnerPrimitiveToProfiler(permuteName, layerName, op); @@ -159,14 +162,15 @@ void CreateConvolutionBackpropDataOp(Program& p, const std::shared_ptrget_pads_begin(), op->get_dilations(), op->get_strides(), 1); auto deconvPrim = cldnn::deconvolution(layerName, - inputs[0], - weights, - {}, - params.groups, - params.stride, - params.padding, - CldnnTensorFromIEDims(op->get_output_tensor(0).get_shape()), - weights_have_group_dim); + inputs[0], + weights, + {}, + params.groups, + params.stride, + params.padding, + CldnnTensorFromIEDims(op->get_output_tensor(0).get_shape()), + weights_have_group_dim, + op->get_friendly_name()); p.AddPrimitive(deconvPrim); p.AddPrimitiveToProfiler(op); @@ -202,7 +206,8 @@ void CreateGroupConvolutionBackpropDataOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(permutePrim); p.AddInnerPrimitiveToProfiler(permuteName, layerName, op); @@ -214,14 +219,15 @@ void CreateGroupConvolutionBackpropDataOp(Program& p, const std::shared_ptrget_output_tensor(0).get_shape()), - weights_have_group_dim); + inputs[0], + weights, + {}, + params.groups, + params.stride, + params.padding, + CldnnTensorFromIEDims(op->get_output_tensor(0).get_shape()), + weights_have_group_dim, + op->get_friendly_name()); p.AddPrimitive(deconvPrim); p.AddPrimitiveToProfiler(op); @@ -247,7 +253,8 @@ void CreateDeformableConvolutionOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(convPrim); p.AddPrimitiveToProfiler(op); @@ -280,7 +287,8 @@ void CreateDeformableConvolutionOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(defConvPrimInterp); p.AddInnerPrimitiveToProfiler(defConvLayerNameInterp, defConvLayerNameConv, op); auto defConvPrim = cldnn::deformable_conv(defConvLayerNameConv, @@ -288,7 +296,8 @@ void CreateDeformableConvolutionOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(defConvPrim); p.AddPrimitiveToProfiler(defConvLayerNameConv, op); } @@ -313,7 +322,8 @@ void CreateBinaryConvolutionOp(Program& p, const std::shared_ptrget_pad_value(), - calc_precision); + calc_precision, + op->get_friendly_name()); p.AddPrimitive(convPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/ctc_greedy_decoder.cpp b/inference-engine/src/cldnn_engine/ops/ctc_greedy_decoder.cpp index c8bd8d54e07..4ff72462a47 100644 --- a/inference-engine/src/cldnn_engine/ops/ctc_greedy_decoder.cpp +++ 
b/inference-engine/src/cldnn_engine/ops/ctc_greedy_decoder.cpp @@ -11,6 +11,7 @@ #include "cldnn/primitives/ctc_greedy_decoder.hpp" #include "cldnn/primitives/reorder.hpp" #include "cldnn/primitives/mutable_data.hpp" +#include "cldnn/runtime/debug_configuration.hpp" #include "transformations/utils/utils.hpp" @@ -33,7 +34,10 @@ void CreateCommonCTCGreedyDecoderOp(Program& p, const std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); reorderedInputs[portIndex] = (reorderPrimName); @@ -70,11 +74,16 @@ void CreateCommonCTCGreedyDecoderOp(Program& p, const std::shared_ptrget_output_shape(1).size()), CldnnTensorFromIEDims(op->get_output_shape(1))); + GPU_DEBUG_GET_INSTANCE(debug_config); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << layer_type_name_ID(op) << ": mutable data]" << std::endl; + } shared_memory.emplace_back(p.GetEngine().allocate_memory(mutableLayout)); cldnn::primitive_id ctc_gd_mutable_id_w = layer_type_name_ID(op) + "_md_write"; - auto ctc_gd_mutable_prim = cldnn::mutable_data(ctc_gd_mutable_id_w, shared_memory[0]); - p.primitivesToIRLayersMap[ctc_gd_mutable_id_w] = { op->get_friendly_name() }; + auto ctc_gd_mutable_prim = cldnn::mutable_data(ctc_gd_mutable_id_w, + shared_memory[0], + op->get_friendly_name()); p.primitiveIDs[ctc_gd_mutable_id_w] = ctc_gd_mutable_id_w; p.AddPrimitive(ctc_gd_mutable_prim); reorderedInputs.push_back(ctc_gd_mutable_id_w); @@ -86,7 +95,8 @@ void CreateCommonCTCGreedyDecoderOp(Program& p, const std::shared_ptrget_output_shape(0))); + CldnnTensorFromIEDims(op->get_output_shape(0)), + op->get_friendly_name()); // clDNN primitive supports only i32 as output data type primitive.output_data_type = DataTypeFromPrecision(ngraph::element::i32); @@ -99,8 +109,10 @@ void CreateCommonCTCGreedyDecoderOp(Program& p, const std::shared_ptrget_friendly_name() }; + auto ctc_gd_mutable_prim_r = cldnn::mutable_data(ctc_gd_mutable_id_r, + { CTCGreedyDecoderLayerName }, + shared_memory[0], + op->get_friendly_name()); p.primitiveIDs[ctc_gd_mutable_id_r] = ctc_gd_mutable_id_r; p.AddPrimitive(ctc_gd_mutable_prim_r); } diff --git a/inference-engine/src/cldnn_engine/ops/cum_sum.cpp b/inference-engine/src/cldnn_engine/ops/cum_sum.cpp index 1bdcec2957e..9f8e2a463f2 100644 --- a/inference-engine/src/cldnn_engine/ops/cum_sum.cpp +++ b/inference-engine/src/cldnn_engine/ops/cum_sum.cpp @@ -63,7 +63,8 @@ void CreateCumSumOp(Program& p, const std::shared_ptr& o inputPrimitives[0], GetCumSumAxis(axis, rank), exclusive, - reverse); + reverse, + op->get_friendly_name()); p.AddPrimitive(primitive); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/custom.cpp b/inference-engine/src/cldnn_engine/ops/custom.cpp index 85945bfbdb9..c967100d1f9 100644 --- a/inference-engine/src/cldnn_engine/ops/custom.cpp +++ b/inference-engine/src/cldnn_engine/ops/custom.cpp @@ -145,7 +145,10 @@ void CreateCustomOp(Program& p, const std::shared_ptr& op, CLDNNCu reorderPrimName, inputPrimitives[param.portIndex], param.format, - DataTypeFromPrecision(op->get_input_element_type(param.portIndex))); + DataTypeFromPrecision(op->get_input_element_type(param.portIndex)), + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); @@ -229,7 +232,8 @@ void CreateCustomOp(Program& p, const 
std::shared_ptr& op, CLDNNCu customLayer->CompilerOptions(), outputLayout, gws, - lws); + lws, + op->get_friendly_name()); auto prevLayerName = genericLayerName; if (outputLayout.format != cldnn::format::any) { @@ -239,7 +243,10 @@ void CreateCustomOp(Program& p, const std::shared_ptr& op, CLDNNCu cldnn::reorder(reorderPrimName, genericLayerName, DefaultFormatForDims(op->get_output_shape(0).size()), - customPrim.output_layout.data_type)); + customPrim.output_layout.data_type, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name())); prevLayerName = reorderPrimName; p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); } diff --git a/inference-engine/src/cldnn_engine/ops/depth_to_space.cpp b/inference-engine/src/cldnn_engine/ops/depth_to_space.cpp index b53262ab23d..aa762a356d7 100644 --- a/inference-engine/src/cldnn_engine/ops/depth_to_space.cpp +++ b/inference-engine/src/cldnn_engine/ops/depth_to_space.cpp @@ -33,7 +33,8 @@ void CreateDepthToSpaceOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(depthToSpacePrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/detection_output.cpp b/inference-engine/src/cldnn_engine/ops/detection_output.cpp index aa2b505f0e7..80616090655 100644 --- a/inference-engine/src/cldnn_engine/ops/detection_output.cpp +++ b/inference-engine/src/cldnn_engine/ops/detection_output.cpp @@ -75,7 +75,8 @@ void CreateDetectionOutputOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(detectionPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/eltwise.cpp b/inference-engine/src/cldnn_engine/ops/eltwise.cpp index 817512d5bf9..f486bff593d 100644 --- a/inference-engine/src/cldnn_engine/ops/eltwise.cpp +++ b/inference-engine/src/cldnn_engine/ops/eltwise.cpp @@ -46,7 +46,13 @@ void CreateElementwiseOp(Program& p, const std::shared_ptr& op, cl if (targetFormat.value != DefaultFormatForDims(inputRank).value) { auto reorderName = layerName + "_cldnn_in" + std::to_string(i) + "_reorder"; auto targetDatatype = DataTypeFromPrecision(op->get_input_element_type(i)); - auto reorderPrim = cldnn::reorder(reorderName, inputPrimitives[i], targetFormat, targetDatatype); + auto reorderPrim = cldnn::reorder(reorderName, + inputPrimitives[i], + targetFormat, + targetDatatype, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(reorderPrim); p.AddInnerPrimitiveToProfiler(reorderName, layerName, op); @@ -61,7 +67,7 @@ void CreateElementwiseOp(Program& p, const std::shared_ptr& op, cl auto targetShape = CldnnTensorFromIEDims(inputShape); - auto reshapePrim = cldnn::reshape(reshapeName, inputPrimitives[i], targetShape); + auto reshapePrim = cldnn::reshape(reshapeName, inputPrimitives[i], targetShape, op->get_friendly_name()); p.AddPrimitive(reshapePrim); p.AddInnerPrimitiveToProfiler(reshapeName, layerName, op); @@ -74,7 +80,8 @@ void CreateElementwiseOp(Program& p, const std::shared_ptr& op, cl inputPrimitives, mode, {}, - out_dt); + out_dt, + op->get_friendly_name()); p.AddPrimitive(eltwisePrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/embedding_bag.cpp b/inference-engine/src/cldnn_engine/ops/embedding_bag.cpp index 2e97a60aebf..369c0eca44a 100644 --- a/inference-engine/src/cldnn_engine/ops/embedding_bag.cpp +++ b/inference-engine/src/cldnn_engine/ops/embedding_bag.cpp @@ -49,7 +49,10 @@ void CreateEmbeddingBagOffsetsSumOp(Program& p, const 
std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); reorderedInputs[portIndex] = (reorderPrimName); @@ -62,7 +65,8 @@ void CreateEmbeddingBagOffsetsSumOp(Program& p, const std::shared_ptrget_output_shape(0)), - defaultIndex); + defaultIndex, + op->get_friendly_name()); p.AddPrimitive(embeddingBagPrim); p.AddPrimitiveToProfiler(op); @@ -86,7 +90,10 @@ void CreateEmbeddingBagPackedSumOp(Program& p, const std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); reorderedInputs[portIndex] = (reorderPrimName); @@ -98,7 +105,9 @@ void CreateEmbeddingBagPackedSumOp(Program& p, const std::shared_ptrget_output_shape(0))); + CldnnTensorFromIEDims(op->get_output_shape(0)), + -1, + op->get_friendly_name()); p.AddPrimitive(embeddingBagPrim); p.AddPrimitiveToProfiler(op); @@ -140,7 +149,10 @@ void CreateEmbeddingSegmentsSumOp(Program& p, const std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); reorderedInputs[portIndex] = (reorderPrimName); @@ -153,7 +165,8 @@ void CreateEmbeddingSegmentsSumOp(Program& p, const std::shared_ptrget_output_shape(0)), - defaultIndex); + defaultIndex, + op->get_friendly_name()); p.AddPrimitive(embeddingBagPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/extract_image_patches.cpp b/inference-engine/src/cldnn_engine/ops/extract_image_patches.cpp index 23b5f014320..088a0fcd413 100644 --- a/inference-engine/src/cldnn_engine/ops/extract_image_patches.cpp +++ b/inference-engine/src/cldnn_engine/ops/extract_image_patches.cpp @@ -38,7 +38,8 @@ void CreateExtractImagePatchesOp(Program& p, const std::shared_ptrget_output_shape(0))); + CldnnTensorFromIEDims(op->get_output_shape(0)), + op->get_friendly_name()); p.AddPrimitive(extractImagePatchesPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/fake_quantize.cpp b/inference-engine/src/cldnn_engine/ops/fake_quantize.cpp index 345a70f34bb..52ea33e5d3d 100644 --- a/inference-engine/src/cldnn_engine/ops/fake_quantize.cpp +++ b/inference-engine/src/cldnn_engine/ops/fake_quantize.cpp @@ -31,7 +31,8 @@ void CreateFakeQuantizeOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(quantizationPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/gather tree.cpp b/inference-engine/src/cldnn_engine/ops/gather tree.cpp index 6b73131fd29..5476aa40d97 100644 --- a/inference-engine/src/cldnn_engine/ops/gather tree.cpp +++ b/inference-engine/src/cldnn_engine/ops/gather tree.cpp @@ -30,7 +30,10 @@ void CreateGatherTreeOp(Program& p, const std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layerName, op); reorderedInputs[portIndex] = reorderPrimName; @@ -43,7 +46,8 @@ void CreateGatherTreeOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(gatherTreePrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/gather.cpp b/inference-engine/src/cldnn_engine/ops/gather.cpp index d22258e0673..bcf632f3194 100644 --- 
a/inference-engine/src/cldnn_engine/ops/gather.cpp +++ b/inference-engine/src/cldnn_engine/ops/gather.cpp @@ -77,7 +77,10 @@ void CreateGatherOpBase(Program& p, const std::shared_ptr& op, const int64_t auto preprocessPrim = cldnn::reorder(reorderPrimName, inputPrimitives[portIndex], targetFormat, - cldnn::data_types::i32); + cldnn::data_types::i32, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layerName, op); reorderedInputs[portIndex] = reorderPrimName; @@ -94,7 +97,8 @@ void CreateGatherOpBase(Program& p, const std::shared_ptr& op, const int64_t outLayout, CldnnTensorFromIEDims(op->get_output_shape(0)), batch_dim, - support_neg_ind); + support_neg_ind, + op->get_friendly_name()); p.AddPrimitive(gatherPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/gather_elements.cpp b/inference-engine/src/cldnn_engine/ops/gather_elements.cpp index d6138280750..50c25c37f1c 100644 --- a/inference-engine/src/cldnn_engine/ops/gather_elements.cpp +++ b/inference-engine/src/cldnn_engine/ops/gather_elements.cpp @@ -55,7 +55,8 @@ void CreateGatherElementsOp(Program& p, const std::shared_ptrget_output_shape(0)), - GetGatherAxis(axis, rank)); + GetGatherAxis(axis, rank), + op->get_friendly_name()); p.AddPrimitive(primitive); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/gather_nd.cpp b/inference-engine/src/cldnn_engine/ops/gather_nd.cpp index cbdc5659bb3..266ada7f904 100644 --- a/inference-engine/src/cldnn_engine/ops/gather_nd.cpp +++ b/inference-engine/src/cldnn_engine/ops/gather_nd.cpp @@ -22,10 +22,11 @@ void CreateGatherNDOp(Program& p, const std::shared_ptrget_batch_dims(); auto primitive = cldnn::gather_nd(layerName, - inputPrimitives[0], - inputPrimitives[1], - indices_rank, - batch_dims); + inputPrimitives[0], + inputPrimitives[1], + indices_rank, + batch_dims, + op->get_friendly_name()); p.AddPrimitive(primitive); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/grn.cpp b/inference-engine/src/cldnn_engine/ops/grn.cpp index 960dd034947..c6d07fe6191 100644 --- a/inference-engine/src/cldnn_engine/ops/grn.cpp +++ b/inference-engine/src/cldnn_engine/ops/grn.cpp @@ -19,7 +19,8 @@ void CreateGRNOp(Program& p, const std::shared_ptr& op) { auto primitive = cldnn::grn(layerName, inputPrimitives[0], op->get_bias(), - DataTypeFromPrecision(op->get_output_element_type(0))); + DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name()); p.AddPrimitive(primitive); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/interpolate.cpp b/inference-engine/src/cldnn_engine/ops/interpolate.cpp index df99e6972ee..190032897b4 100644 --- a/inference-engine/src/cldnn_engine/ops/interpolate.cpp +++ b/inference-engine/src/cldnn_engine/ops/interpolate.cpp @@ -193,7 +193,8 @@ void CreateInterpolateOp(Program& p, const std::shared_ptrget_friendly_name()); p.AddPrimitive(resamplePrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/loop.cpp b/inference-engine/src/cldnn_engine/ops/loop.cpp index 1ac452265b8..604f73b7e5a 100644 --- a/inference-engine/src/cldnn_engine/ops/loop.cpp +++ b/inference-engine/src/cldnn_engine/ops/loop.cpp @@ -29,11 +29,11 @@ using Loop = ngraph::op::v5::Loop; namespace CLDNNPlugin { template -static DATA_TYPE CreateScalarData(Program &p, const cldnn::primitive_id& id, int64_t num) { +static DATA_TYPE 
CreateScalarData(Program &p, const cldnn::primitive_id& id, int64_t num, const cldnn::primitive_id& ext_prim_id) { auto mem = p.GetEngine().allocate_memory({ cldnn::data_types::i64, cldnn::format::bfyx, { 1, 1, 1, 1 } }); cldnn::mem_lock ptr{mem, p.GetEngine().get_program_stream()}; *ptr.begin() = num; - return {id, mem}; + return {id, mem, ext_prim_id}; } static cldnn::mutable_data CreateAdditionalOutputData(Program &p, const std::shared_ptr& op, @@ -44,7 +44,7 @@ static cldnn::mutable_data CreateAdditionalOutputData(Program &p, const std::sha const auto tensor = CldnnTensorFromIEDims(op->get_output_shape(output_idx)); cldnn::layout output_layout = cldnn::layout(precision, format, tensor); auto mem = p.GetEngine().allocate_memory(output_layout); - auto md = cldnn::mutable_data(id, {input}, mem); // cldnn::data cannot set dependency + auto md = cldnn::mutable_data(id, {input}, mem, op->get_friendly_name()); // cldnn::data cannot set dependency return md; } @@ -161,8 +161,7 @@ void CreateLoopOp(Program& p, const std::shared_ptr& op) { } const cldnn::primitive_id num_iteration_id = layerName + "_numIteration"; { - cldnn::mutable_data num_iteration = CreateScalarData(p, num_iteration_id, 0); - p.primitivesToIRLayersMap[num_iteration_id] = { op->get_friendly_name() }; + cldnn::mutable_data num_iteration = CreateScalarData(p, num_iteration_id, 0, op->get_friendly_name()); p.primitiveIDs[num_iteration_id] = num_iteration_id; p.AddPrimitive(num_iteration); p.AddInnerPrimitiveToProfiler(num_iteration_id, layerName, op); @@ -216,7 +215,8 @@ void CreateLoopOp(Program& p, const std::shared_ptr& op) { back_edges, /* back edge mapping */ num_iterations, /* max iteration, i.e. length of iteration axis */ body_current_iteration_id, - body_execution_condition_id); + body_execution_condition_id, + op->get_friendly_name()); p.AddPrimitive(loopPrimitive); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/lrn.cpp b/inference-engine/src/cldnn_engine/ops/lrn.cpp index c13c17daaeb..28e55bf038f 100644 --- a/inference-engine/src/cldnn_engine/ops/lrn.cpp +++ b/inference-engine/src/cldnn_engine/ops/lrn.cpp @@ -38,7 +38,8 @@ void CreateLRNOp(Program& p, const std::shared_ptr& op) { static_cast(op->get_bias()), static_cast(op->get_alpha()), static_cast(op->get_beta()), - GetNormRegion(axis_value)); + GetNormRegion(axis_value), + op->get_friendly_name()); p.AddPrimitive(lrnPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/matmul.cpp b/inference-engine/src/cldnn_engine/ops/matmul.cpp index 3d09fc7fd4e..53b8fecd6c2 100644 --- a/inference-engine/src/cldnn_engine/ops/matmul.cpp +++ b/inference-engine/src/cldnn_engine/ops/matmul.cpp @@ -89,7 +89,8 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o auto permuteName = op->get_friendly_name() + "/transpose_b"; auto permutePrim = cldnn::permute(permuteName, weightsName, - cldnn_permute_order); + cldnn_permute_order, + op->get_friendly_name()); p.AddPrimitive(permutePrim); p.AddInnerPrimitiveToProfiler(permuteName, layerName, op); weightsName = permuteName; @@ -108,7 +109,8 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o auto permuteName = op->get_friendly_name() + "/transpose_a"; auto permutePrim = cldnn::permute(permuteName, inputName, - cldnn_permute_order); + cldnn_permute_order, + op->get_friendly_name()); p.AddPrimitive(permutePrim); p.AddInnerPrimitiveToProfiler(permuteName, layerName, op); inputName = permuteName; @@ -124,7 +126,10 @@ void CreateMatMulOp(Program& p, const 
std::shared_ptr& o IE_THROW() << "Inconsistent reshape in Matmul op: " << op->get_friendly_name(); auto reshapeInName = op->get_friendly_name() + suffix; - auto reshapeInPrim = cldnn::reshape(reshapeInName, inputName, CldnnTensorFromIEDims(reshapeSize)); + auto reshapeInPrim = cldnn::reshape(reshapeInName, + inputName, + CldnnTensorFromIEDims(reshapeSize), + op->get_friendly_name()); p.AddPrimitive(reshapeInPrim); p.AddInnerPrimitiveToProfiler(reshapeInName, layerName, op); return reshapeInName; @@ -144,6 +149,7 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o weightsName, "", DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name(), cldnn::padding(), input_rank); @@ -153,7 +159,7 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o if (reshape_fc) { auto outputShape = CldnnTensorFromIEDims(op->get_output_shape(0)); auto outReshapeName = layerName + "_cldnn_out_reshape"; - auto outReshapePrim = cldnn::reshape(outReshapeName, layerName, outputShape); + auto outReshapePrim = cldnn::reshape(outReshapeName, layerName, outputShape, op->get_friendly_name()); p.AddPrimitive(outReshapePrim); p.AddInnerPrimitiveToProfiler(outReshapeName, layerName, op); @@ -188,7 +194,13 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o if (targetFormat.value != DefaultFormatForDims(inputDimsN).value) { auto reorderName = layerName + "_cldnn_in" + std::to_string(i) + "_reorder"; auto targetDatatype = DataTypeFromPrecision(op->get_output_element_type(0)); - auto reorderPrim = cldnn::reorder(reorderName, inputPrimitives[i], targetFormat, targetDatatype); + auto reorderPrim = cldnn::reorder(reorderName, + inputPrimitives[i], + targetFormat, + targetDatatype, + std::vector(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(reorderPrim); p.AddInnerPrimitiveToProfiler(reorderName, layerName, op); @@ -227,7 +239,7 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o auto targetShape = gemmSpecificTensor(inputDims); - auto reshapePrim = cldnn::reshape(reshapeName, inputPrimitives[i], targetShape); + auto reshapePrim = cldnn::reshape(reshapeName, inputPrimitives[i], targetShape, op->get_friendly_name()); p.AddPrimitive(reshapePrim); p.AddInnerPrimitiveToProfiler(reshapeName, layerName, op); @@ -248,7 +260,8 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o transA, transB, alpha, - beta); + beta, + op->get_friendly_name()); p.AddPrimitive(gemmPrim); @@ -258,7 +271,7 @@ void CreateMatMulOp(Program& p, const std::shared_ptr& o if (outDimsN < 4) { auto outputShape = CldnnTensorFromIEDims(outDims); auto outReshapeName = layerName + "_cldnn_out_reshape"; - auto outReshapePrim = cldnn::reshape(outReshapeName, layerName, outputShape); + auto outReshapePrim = cldnn::reshape(outReshapeName, layerName, outputShape, op->get_friendly_name()); p.AddPrimitive(outReshapePrim); p.AddInnerPrimitiveToProfiler(outReshapeName, layerName, op); diff --git a/inference-engine/src/cldnn_engine/ops/mvn.cpp b/inference-engine/src/cldnn_engine/ops/mvn.cpp index b9cb376a24e..abd2128326b 100644 --- a/inference-engine/src/cldnn_engine/ops/mvn.cpp +++ b/inference-engine/src/cldnn_engine/ops/mvn.cpp @@ -24,7 +24,8 @@ static void CreateCommonMVNOp(Program& p, const std::shared_ptr& o normalize_variance, eps, eps_inside_sqrt, - across_channels); + across_channels, + op->get_friendly_name()); p.AddPrimitive(mvnPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/non_max_suppression.cpp 
b/inference-engine/src/cldnn_engine/ops/non_max_suppression.cpp index 8adaa3cfa76..b5c2e05e711 100644 --- a/inference-engine/src/cldnn_engine/ops/non_max_suppression.cpp +++ b/inference-engine/src/cldnn_engine/ops/non_max_suppression.cpp @@ -12,6 +12,7 @@ #include "cldnn/primitives/reorder.hpp" #include "cldnn/primitives/mutable_data.hpp" #include "cldnn/primitives/non_max_suppression.hpp" +#include "cldnn/runtime/debug_configuration.hpp" namespace CLDNNPlugin { @@ -41,7 +42,10 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptr(), + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name()); p.AddPrimitive(preprocessPrim); p.AddInnerPrimitiveToProfiler(reorderPrimName, layer_type_name_ID(op), op); reorderedInputs[portIndex] = (reorderPrimName); @@ -63,6 +67,7 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptrget_output_size(); std::vector shared_memory; + GPU_DEBUG_GET_INSTANCE(debug_config); switch (num_output) { case 3: { auto mutable_precision_second = op->get_output_element_type(2); @@ -74,11 +79,15 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptrget_output_shape(2).size()), CldnnTensorFromIEDims(op->get_output_shape(2))); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << layer_type_name_ID(op) << ": mutable data]" << std::endl; + } shared_memory.emplace_back(p.GetEngine().allocate_memory(mutableLayoutSecond)); cldnn::primitive_id non_max_supression_mutable_id_w_second = layer_type_name_ID(op) + "_md_write_second"; - auto nms_mutable_prim_second = cldnn::mutable_data(non_max_supression_mutable_id_w_second, shared_memory.back()); - p.primitivesToIRLayersMap[non_max_supression_mutable_id_w_second] = { op->get_friendly_name() }; + auto nms_mutable_prim_second = cldnn::mutable_data(non_max_supression_mutable_id_w_second, + shared_memory.back(), + op->get_friendly_name()); p.primitiveIDs[non_max_supression_mutable_id_w_second] = non_max_supression_mutable_id_w_second; p.AddPrimitive(nms_mutable_prim_second); inputPrimitives.push_back(non_max_supression_mutable_id_w_second); @@ -91,11 +100,15 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptr(outputIndices), 3, 1, 1)); + GPU_DEBUG_IF(debug_config->verbose >= 2) { + GPU_DEBUG_COUT << "[" << layer_type_name_ID(op) << ": mutable data]" << std::endl; + } shared_memory.emplace_back(p.GetEngine().allocate_memory(mutableLayoutFirst)); cldnn::primitive_id non_max_supression_mutable_id_w_first = layer_type_name_ID(op) + "_md_write_first"; - auto nms_mutable_prim_first = cldnn::mutable_data(non_max_supression_mutable_id_w_first, shared_memory.back()); - p.primitivesToIRLayersMap[non_max_supression_mutable_id_w_first] = { op->get_friendly_name() }; + auto nms_mutable_prim_first = cldnn::mutable_data(non_max_supression_mutable_id_w_first, + shared_memory.back(), + op->get_friendly_name()); p.primitiveIDs[non_max_supression_mutable_id_w_first] = non_max_supression_mutable_id_w_first; p.AddPrimitive(nms_mutable_prim_first); inputPrimitives.push_back(non_max_supression_mutable_id_w_first); @@ -112,7 +125,9 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptr(outputIndices), op->m_center_point_box, - op->m_sort_result_descending); + op->m_sort_result_descending, + "", "", "", "", "", "", + op->get_friendly_name()); prim.output_data_type = DataTypeFromPrecision(out_type); @@ -136,15 +151,19 @@ void CreateNonMaxSuppressionIEInternalOp(Program& p, const std::shared_ptrget_friendly_name() }; + auto 
nms_mutable_prim_r_second = cldnn::mutable_data(non_max_supression_id_r_second, + { nonMaxSupressionLayerName }, + shared_memory.front(), + op->get_friendly_name()); p.primitiveIDs[non_max_supression_id_r_second] = non_max_supression_id_r_second; p.AddPrimitive(nms_mutable_prim_r_second); } case 2: { cldnn::primitive_id non_max_supression_id_r_first = layer_type_name_ID(op) + ".1"; - auto nms_mutable_prim_r_first = cldnn::mutable_data(non_max_supression_id_r_first, { nonMaxSupressionLayerName }, shared_memory.back()); - p.primitivesToIRLayersMap[non_max_supression_id_r_first] = { op->get_friendly_name() }; + auto nms_mutable_prim_r_first = cldnn::mutable_data(non_max_supression_id_r_first, + { nonMaxSupressionLayerName }, + shared_memory.back(), + op->get_friendly_name()); p.primitiveIDs[non_max_supression_id_r_first] = non_max_supression_id_r_first; p.AddPrimitive(nms_mutable_prim_r_first); } diff --git a/inference-engine/src/cldnn_engine/ops/normalize_l2.cpp b/inference-engine/src/cldnn_engine/ops/normalize_l2.cpp index 85f2eb95de8..315dee55952 100644 --- a/inference-engine/src/cldnn_engine/ops/normalize_l2.cpp +++ b/inference-engine/src/cldnn_engine/ops/normalize_l2.cpp @@ -45,14 +45,15 @@ void CreateNormalizeL2Op(Program& p, const std::shared_ptrget_data_ptr(), bufSize); auto scalesName = layerName + "_cldnn_input_scales"; - p.AddPrimitive(cldnn::data(scalesName, mem)); + p.AddPrimitive(cldnn::data(scalesName, mem, op->get_friendly_name())); p.AddInnerPrimitiveToProfiler(scalesName, layerName, op); auto normPrim = cldnn::normalize(layerName, inputPrimitives[0], scalesName, across_spatial, - eps); + eps, + op->get_friendly_name()); p.AddPrimitive(normPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/one_hot.cpp b/inference-engine/src/cldnn_engine/ops/one_hot.cpp index 3d792bda8ae..b7c4fe8a126 100644 --- a/inference-engine/src/cldnn_engine/ops/one_hot.cpp +++ b/inference-engine/src/cldnn_engine/ops/one_hot.cpp @@ -53,7 +53,8 @@ void CreateOneHotOp(Program& p, const std::shared_ptr& o DataTypeFromPrecision(op->get_output_element_type(0)), static_cast(axis), on_value, - off_value); + off_value, + op->get_friendly_name()); p.AddPrimitive(oneHotPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/pad.cpp b/inference-engine/src/cldnn_engine/ops/pad.cpp index 0d409414b58..40336df057c 100644 --- a/inference-engine/src/cldnn_engine/ops/pad.cpp +++ b/inference-engine/src/cldnn_engine/ops/pad.cpp @@ -66,7 +66,8 @@ void CreatePadOp(Program& p, const std::shared_ptr& op) { pads_begin, pads_end, border_mode, - pad_value); + pad_value, + op->get_friendly_name()); p.AddPrimitive(tilePrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/parameter.cpp b/inference-engine/src/cldnn_engine/ops/parameter.cpp index b68593dd0a5..6dd43841cf3 100644 --- a/inference-engine/src/cldnn_engine/ops/parameter.cpp +++ b/inference-engine/src/cldnn_engine/ops/parameter.cpp @@ -195,8 +195,8 @@ void CreateParameterOp(Program& p, const std::shared_ptrname()); + auto inputUV = cldnn::input_layout(uv_name, uv_layout, inputInfo->name()); p.AddPrimitive(inputY); p.inputLayouts.insert({ inputInfo->name() + "_Y" + std::to_string(i), y_layout }); @@ -205,20 +205,29 @@ void CreateParameterOp(Program& p, const std::shared_ptrname())); break; } case MEAN_IMAGE: { - p.AddPrimitive(cldnn::reorder(preprocessPrimID, y_name, uv_name, networkInputLayout, meanBlobID)); + p.AddPrimitive(cldnn::reorder(preprocessPrimID, + y_name, + 
uv_name, + networkInputLayout, + meanBlobID, + cldnn::reorder_mean_mode::subtract, + inputInfo->name())); break; } default: IE_THROW(Unexpected) << "Invalid mean variant in input " + inputName; break; } - p.primitivesToIRLayersMap[preprocessPrimID] = { inputInfo->name() }; - p.primitivesToIRLayersMap[y_name] = { inputInfo->name() }; - p.primitivesToIRLayersMap[uv_name] = { inputInfo->name() }; p.profilingIDs.push_back(preprocessPrimID); p.InitProfileInfo(preprocessPrimID, "Reorder"); p.primitiveIDs[inputName] = preprocessPrimID; // If it is batched blob, it will be overwritten afterwards. @@ -228,7 +237,7 @@ void CreateParameterOp(Program& p, const std::shared_ptr 1) { auto concatPrimID = "concat:" + inputName + Program::m_preProcessTag; - p.AddPrimitive(cldnn::concatenation(concatPrimID, reorders, cldnn::concatenation::along_b)); + p.AddPrimitive(cldnn::concatenation(concatPrimID, reorders, cldnn::concatenation::along_b, op->get_friendly_name())); p.primitiveIDs[inputName] = concatPrimID; } } else { @@ -237,20 +246,26 @@ void CreateParameterOp(Program& p, const std::shared_ptrname(), inputLayout }); - p.AddPrimitive(cldnn::input_layout(inputName, inputLayout)); - p.primitivesToIRLayersMap[inputName] = { inputInfo->name() }; + p.AddPrimitive(cldnn::input_layout(inputName, inputLayout, inputInfo->name())); switch (preProcess.getMeanVariant()) { case NONE: case MEAN_VALUE: { - p.AddPrimitive(cldnn::reorder(preprocessPrimID, inputName, networkInputLayout, meanValues)); + p.AddPrimitive(cldnn::reorder(preprocessPrimID, + inputName, + networkInputLayout, + meanValues, + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name())); break; } case MEAN_IMAGE: { p.AddPrimitive(cldnn::reorder(preprocessPrimID, - inputName, - networkInputLayout, - meanBlobID)); + inputName, + networkInputLayout, + meanBlobID, + cldnn::reorder_mean_mode::subtract, + op->get_friendly_name())); break; } default: IE_THROW() << "Invalid mean variant in input " << inputName; diff --git a/inference-engine/src/cldnn_engine/ops/pooling.cpp b/inference-engine/src/cldnn_engine/ops/pooling.cpp index f1bf6952292..1e0db7bd204 100644 --- a/inference-engine/src/cldnn_engine/ops/pooling.cpp +++ b/inference-engine/src/cldnn_engine/ops/pooling.cpp @@ -70,7 +70,8 @@ void CreateAvgPoolOp(Program& p, const std::shared_ptr& params.stride, params.pad_begin, CldnnTensorFromIEDims(op->get_output_shape(0)), - DataTypeFromPrecision(op->get_output_element_type(0))); + DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name()); poolPrim.pad_end = params.pad_end; p.AddPrimitive(poolPrim); p.AddPrimitiveToProfiler(op); @@ -89,7 +90,8 @@ void CreateMaxPoolOp(Program& p, const std::shared_ptr& params.stride, params.pad_begin, CldnnTensorFromIEDims(op->get_output_shape(0)), - DataTypeFromPrecision(op->get_output_element_type(0))); + DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name()); poolPrim.pad_end = params.pad_end; p.AddPrimitive(poolPrim); p.AddPrimitiveToProfiler(op); diff --git a/inference-engine/src/cldnn_engine/ops/prior_box.cpp b/inference-engine/src/cldnn_engine/ops/prior_box.cpp index 6cf0aaa6535..43eb5a69941 100644 --- a/inference-engine/src/cldnn_engine/ops/prior_box.cpp +++ b/inference-engine/src/cldnn_engine/ops/prior_box.cpp @@ -54,7 +54,8 @@ void CreatePriorBoxClusteredOp(Program& p, const std::shared_ptrget_output_element_type(0))); + DataTypeFromPrecision(op->get_output_element_type(0)), + op->get_friendly_name()); p.AddPrimitive(priorBoxPrim); p.AddPrimitiveToProfiler(op); @@ 
diff --git a/inference-engine/src/cldnn_engine/ops/prior_box.cpp b/inference-engine/src/cldnn_engine/ops/prior_box.cpp
index 6cf0aaa6535..43eb5a69941 100644
--- a/inference-engine/src/cldnn_engine/ops/prior_box.cpp
+++ b/inference-engine/src/cldnn_engine/ops/prior_box.cpp
@@ -54,7 +54,8 @@ void CreatePriorBoxClusteredOp(Program& p, const std::shared_ptr<ngraph::op::v0::PriorBoxClustered>& op) {
-                                            DataTypeFromPrecision(op->get_output_element_type(0)));
+                                            DataTypeFromPrecision(op->get_output_element_type(0)),
+                                            op->get_friendly_name());
 
     p.AddPrimitive(priorBoxPrim);
     p.AddPrimitiveToProfiler(op);
@@ -103,7 +104,8 @@ void CreatePriorBoxOp(Program& p, const std::shared_ptr<ngraph::op::v0::PriorBox>& op) {
-                                   DataTypeFromPrecision(op->get_output_element_type(0)));
+                                   DataTypeFromPrecision(op->get_output_element_type(0)),
+                                   op->get_friendly_name());
 
     p.AddPrimitive(priorBoxPrim);
     p.AddPrimitiveToProfiler(op);
diff --git a/inference-engine/src/cldnn_engine/ops/proposal.cpp b/inference-engine/src/cldnn_engine/ops/proposal.cpp
index d5b906e5e6e..9be2f1d4e99 100644
--- a/inference-engine/src/cldnn_engine/ops/proposal.cpp
+++ b/inference-engine/src/cldnn_engine/ops/proposal.cpp
@@ -9,6 +9,7 @@
 
 #include "cldnn/primitives/proposal.hpp"
 #include "cldnn/primitives/mutable_data.hpp"
+#include "cldnn/runtime/debug_configuration.hpp"
 
 namespace CLDNNPlugin {
 
@@ -62,11 +63,16 @@ void CreateProposalOp(Program& p, const std::shared_ptr<ngraph::op::v0::Proposal>& op) {
                                                     DefaultFormatForDims(op->get_output_shape(1).size()),
                                                     CldnnTensorFromIEDims(op->get_output_shape(1)));
 
+        GPU_DEBUG_GET_INSTANCE(debug_config);
+        GPU_DEBUG_IF(debug_config->verbose >= 2) {
+            GPU_DEBUG_COUT << "[" << layer_type_name_ID(op) << ": mutable data]" << std::endl;
+        }
         auto shared_memory = p.GetEngine().allocate_memory(mutableLayout);
 
         cldnn::primitive_id proposal_mutable_id_w = layer_type_name_ID(op) + "_md_write";
-        auto argmax_mutable_prim = cldnn::mutable_data(proposal_mutable_id_w, shared_memory);
-        p.primitivesToIRLayersMap[proposal_mutable_id_w] = { op->get_friendly_name() };
+        auto argmax_mutable_prim = cldnn::mutable_data(proposal_mutable_id_w,
+                                                       shared_memory,
+                                                       op->get_friendly_name());
         p.primitiveIDs[proposal_mutable_id_w] = proposal_mutable_id_w;
         p.AddPrimitive(argmax_mutable_prim);
         inputPrimitives.push_back(proposal_mutable_id_w);
@@ -96,13 +102,16 @@ void CreateProposalOp(Program& p, const std::shared_ptr<ngraph::op::v0::Proposal>& op) {
+                                           op->get_friendly_name());
 
         p.AddPrimitive(proposalPrim);
 
         cldnn::primitive_id proposal_mutable_id_r = layer_type_name_ID(op) + ".1";
-        auto argmax_mutable_prim_r = cldnn::mutable_data(proposal_mutable_id_r, { proposalLayerName }, shared_memory);
-        p.primitivesToIRLayersMap[proposal_mutable_id_r] = { op->get_friendly_name() };
+        auto argmax_mutable_prim_r = cldnn::mutable_data(proposal_mutable_id_r,
+                                                         { proposalLayerName },
+                                                         shared_memory,
+                                                         op->get_friendly_name());
         p.primitiveIDs[proposal_mutable_id_r] = proposal_mutable_id_r;
         p.AddPrimitive(argmax_mutable_prim_r);
 
@@ -134,7 +143,8 @@ void CreateProposalOp(Program& p, const std::shared_ptr<ngraph::op::v0::Proposal>& op) {
+                                       op->get_friendly_name());
 
     p.AddPrimitive(proposalPrim);
     p.AddPrimitiveToProfiler(op);
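Note: the GPU_DEBUG_* macros used in the proposal.cpp hunk come from the newly included cldnn/runtime/debug_configuration.hpp and gate verbose tracing on a process-wide debug configuration. A simplified sketch of what such macros can expand to; the real definitions live in that header and may differ in detail:

    // Simplified sketch, not the verbatim cldnn definitions.
    #include <iostream>

    struct debug_configuration {
        int verbose = 0;  // assumed to be populated from an environment setting
        static const debug_configuration* get_instance() {
            static debug_configuration instance;
            return &instance;
        }
    };

    #define GPU_DEBUG_GET_INSTANCE(name) auto name = debug_configuration::get_instance();
    #define GPU_DEBUG_IF(condition) if (condition)
    #define GPU_DEBUG_COUT std::cout << "[GPU] "

Under this shape, GPU_DEBUG_IF(debug_config->verbose >= 2) { ... } expands to an ordinary if statement, so the logging costs only an integer comparison when verbose output is disabled.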
diff --git a/inference-engine/src/cldnn_engine/ops/reduce.cpp b/inference-engine/src/cldnn_engine/ops/reduce.cpp
index b336a2e78fa..47a54c70299 100644
--- a/inference-engine/src/cldnn_engine/ops/reduce.cpp
+++ b/inference-engine/src/cldnn_engine/ops/reduce.cpp
@@ -75,7 +75,8 @@ void CreateReduceOp(Program& p, const std::shared_ptr<ngraph::Node>& op, cldnn::reduce_mode mode, bool keep_dims) {
                                    inputPrimitives[0],
                                    mode,
                                    axes,
-                                   static_cast<int32_t>(keep_dims));
+                                   static_cast<int32_t>(keep_dims),
+                                   op->get_friendly_name());
 
     p.AddPrimitive(reducePrim);
 
@@ -96,7 +97,7 @@ void CreateReduceOp(Program& p, const std::shared_ptr<ngraph::Node>& op, cldnn::reduce_mode mode, bool keep_dims) {
             outTensor = cldnn::tensor(TensorValue(out_shape[0]), TensorValue(out_shape[1]),
                                       1, TensorValue(out_shape[2]));
         }
-        auto reshape_prim = cldnn::reshape(resultLayerName, layerName, outTensor);
+        auto reshape_prim = cldnn::reshape(resultLayerName, layerName, outTensor, op->get_friendly_name());
         p.AddPrimitive(reshape_prim);
         p.AddPrimitiveToProfiler(op, resultLayerName);
     }
@@ -112,7 +113,13 @@ void CreateReduceOp(Program& p, const std::shared_ptr<ngraph::Node>& op, cldnn::reduce_mode mode, bool keep_dims) {
         else if (rank - rawAxes.size() <= 4)
             out_format = cldnn::format::bfyx;
 
-        auto reorder_prim = cldnn::reorder(reorderLayerName, resultLayerName, out_format, out_dt);
+        auto reorder_prim = cldnn::reorder(reorderLayerName,
+                                           resultLayerName,
+                                           out_format,
+                                           out_dt,
+                                           std::vector<float>(),
+                                           cldnn::reorder_mean_mode::subtract,
+                                           op->get_friendly_name());
         p.AddPrimitive(reorder_prim);
         p.AddPrimitiveToProfiler(op, reorderLayerName);
     } else {
diff --git a/inference-engine/src/cldnn_engine/ops/region_yolo.cpp b/inference-engine/src/cldnn_engine/ops/region_yolo.cpp
index 348dd0f7eeb..314950027cb 100644
--- a/inference-engine/src/cldnn_engine/ops/region_yolo.cpp
+++ b/inference-engine/src/cldnn_engine/ops/region_yolo.cpp
@@ -28,7 +28,8 @@ void CreateRegionYoloOp(Program& p, const std::shared_ptr<ngraph::op::v0::RegionYolo>& op) {
+                                     op->get_friendly_name());
 
     p.AddPrimitive(regionPrim);
     p.AddPrimitiveToProfiler(op);
diff --git a/inference-engine/src/cldnn_engine/ops/reorg_yolo.cpp b/inference-engine/src/cldnn_engine/ops/reorg_yolo.cpp
index 4a7f54cf810..9c47ccc9fb0 100644
--- a/inference-engine/src/cldnn_engine/ops/reorg_yolo.cpp
+++ b/inference-engine/src/cldnn_engine/ops/reorg_yolo.cpp
@@ -20,7 +20,8 @@ void CreateReorgYoloOp(Program& p, const std::shared_ptr<ngraph::op::v0::ReorgYolo>& op) {
+                                    op->get_friendly_name());
 
     p.AddPrimitive(reorgPrim);
     p.AddPrimitiveToProfiler(op);
diff --git a/inference-engine/src/cldnn_engine/ops/reshape.cpp b/inference-engine/src/cldnn_engine/ops/reshape.cpp
index f0084bb6a1c..a4978fbae29 100644
--- a/inference-engine/src/cldnn_engine/ops/reshape.cpp
+++ b/inference-engine/src/cldnn_engine/ops/reshape.cpp
@@ -36,9 +36,13 @@ void CreateCommonReshapeOp(Program& p, const std::shared_ptr<ngraph::Node>& op) {
         }
 
         cldnn::layout outputLayout(DataTypeFromPrecision(op->get_output_element_type(0)), outputFormat, outTensor);
-        p.AddPrimitive(cldnn::reorder(reorderId, reshapeInputId, outputLayout));
+        p.AddPrimitive(cldnn::reorder(reorderId,
+                                      reshapeInputId,
+                                      outputLayout,
+                                      std::vector<float>(),
+                                      cldnn::reorder_mean_mode::subtract,
+                                      op->get_friendly_name()));
         p.InitProfileInfo(reorderId, "Reorder", false, InferenceEngine::InferenceEngineProfileInfo::EXECUTED, layerName);
-        p.primitivesToIRLayersMap[reorderId] = { op->get_friendly_name() };
         p.primitiveIDs[layerName + "_reorder"] = reorderId;
         p.primitiveIDs[reorderId] = reorderId;
         p.profilingIDs.push_back(reorderId);
@@ -47,7 +51,8 @@ void CreateCommonReshapeOp(Program& p, const std::shared_ptr<ngraph::Node>& op) {
 
     auto reshapePrim = cldnn::reshape(layerName,
                                       reshapeInputId,
-                                      outTensor);
+                                      outTensor,
+                                      op->get_friendly_name());
 
     p.AddPrimitive(reshapePrim);
     p.AddPrimitiveToProfiler(op);
diff --git a/inference-engine/src/cldnn_engine/ops/result.cpp b/inference-engine/src/cldnn_engine/ops/result.cpp
index fe0d0f05658..c1219ad8fba 100644
--- a/inference-engine/src/cldnn_engine/ops/result.cpp
+++ b/inference-engine/src/cldnn_engine/ops/result.cpp
@@ -56,9 +56,12 @@ void CreateResultOp(Program& p, const std::shared_ptr<ngraph::op::v0::Result>& op) {
     std::string outputID = inputs[0];
 
     p.AddPrimitive(cldnn::reorder(outLayerName,
-                                  outputID,
-                                  FormatFromLayout(outputData->getLayout()),
-                                  DataTypeFromPrecision(precision)));
+                                  outputID,
+                                  FormatFromLayout(outputData->getLayout()),
+                                  DataTypeFromPrecision(precision),
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
     p.InitProfileInfo(outLayerName, "reorder");
     p.profilingIDs.push_back(outLayerName);
     p.primitiveIDs[outLayerName] = outLayerName;
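Note: the new friendly-name argument sits after cldnn::reorder's optional mean-value and mean-mode parameters, which is why call sites that previously relied on the defaults (reduce.cpp, reshape.cpp, and result.cpp above) must now spell out std::vector<float>() and cldnn::reorder_mean_mode::subtract explicitly. An assumed outline of the parameter ordering, for illustration only; the real declaration lives in cldnn/primitives/reorder.hpp and may differ:

    // Illustrative signature sketch with stand-in types.
    #include <string>
    #include <vector>

    namespace sketch {
    using primitive_id = std::string;
    enum class reorder_mean_mode { none, subtract };
    struct layout {};

    struct reorder {
        reorder(const primitive_id& id,
                const primitive_id& input,
                const layout& output_layout,
                const std::vector<float>& values_to_subtract = {},
                reorder_mean_mode mode = reorder_mean_mode::subtract,
                const primitive_id& ext_prim_id = "");  // new trailing argument
    };
    }  // namespace sketch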
diff --git a/inference-engine/src/cldnn_engine/ops/reverse_sequence.cpp b/inference-engine/src/cldnn_engine/ops/reverse_sequence.cpp
index 766bbc89a31..6421a01dc75 100644
--- a/inference-engine/src/cldnn_engine/ops/reverse_sequence.cpp
+++ b/inference-engine/src/cldnn_engine/ops/reverse_sequence.cpp
@@ -22,7 +22,8 @@ void CreateReverseSequenceOp(Program& p, const std::shared_ptr<ngraph::op::v0::ReverseSequence>& op) {
+                                              op->get_friendly_name());
 
     p.AddPrimitive(reverseSequencePrim);
     p.AddPrimitiveToProfiler(op);
diff --git a/inference-engine/src/cldnn_engine/ops/rnn.cpp b/inference-engine/src/cldnn_engine/ops/rnn.cpp
index 2d4705f1a91..1ebaa0a7868 100644
--- a/inference-engine/src/cldnn_engine/ops/rnn.cpp
+++ b/inference-engine/src/cldnn_engine/ops/rnn.cpp
@@ -107,8 +107,13 @@ void CreateLSTMCellOp(Program& p, const std::shared_ptr<ngraph::op::v4::LSTMCell>& op) {
-    p.AddPrimitive(cldnn::reshape(inReshapeID, inputPrimitives[0], inputShape));
-    p.AddPrimitive(cldnn::reorder(permuteID, inReshapeID, inputLayout));
+    p.AddPrimitive(cldnn::reshape(inReshapeID, inputPrimitives[0], inputShape, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reorder(permuteID,
+                                  inReshapeID,
+                                  inputLayout,
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
 
     p.AddInnerPrimitiveToProfiler(inReshapeID, op->get_friendly_name(), op);
     p.AddInnerPrimitiveToProfiler(permuteID, op->get_friendly_name(), op);
 
@@ -117,11 +122,24 @@ void CreateLSTMCellOp(Program& p, const std::shared_ptr<ngraph::op::v4::LSTMCell>& op) {
-    p.AddPrimitive(cldnn::reshape(hiddenInResh, inputPrimitives[1], inStateShape));
-    p.AddPrimitive(cldnn::reorder(hiddenInStr, hiddenInResh, hiddenLayout));
-    p.AddPrimitive(cldnn::reshape(cellInResh, inputPrimitives[2], inStateShape));
-    p.AddPrimitive(cldnn::reorder(cellInStr, cellInResh, hiddenLayout));
-    p.AddPrimitive(cldnn::concatenation(input_concatID, { permuteID, hiddenInStr }, cldnn::concatenation::concatenation_axis::along_x));
+    p.AddPrimitive(cldnn::reshape(hiddenInResh, inputPrimitives[1], inStateShape, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reorder(hiddenInStr,
+                                  hiddenInResh,
+                                  hiddenLayout,
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reshape(cellInResh, inputPrimitives[2], inStateShape, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reorder(cellInStr,
+                                  cellInResh,
+                                  hiddenLayout,
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
+    p.AddPrimitive(cldnn::concatenation(input_concatID,
+                                        { permuteID, hiddenInStr },
+                                        cldnn::concatenation::concatenation_axis::along_x,
+                                        op->get_friendly_name()));
 
     p.AddInnerPrimitiveToProfiler(hiddenInResh, op->get_friendly_name(), op);
     p.AddInnerPrimitiveToProfiler(hiddenInStr, op->get_friendly_name(), op);
@@ -139,14 +157,19 @@ void CreateLSTMCellOp(Program& p, const std::shared_ptr<ngraph::op::v4::LSTMCell>& op) {
-    p.AddPrimitive(cldnn::concatenation(WRconcatID, { weightID, recurrentID }, cldnn::concatenation::concatenation_axis::along_y));
+    p.AddPrimitive(cldnn::concatenation(WRconcatID, { weightID, recurrentID }, cldnn::concatenation::concatenation_axis::along_y, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(WRconcatID, op->get_friendly_name(), op);
 
-    p.AddPrimitive(cldnn::fully_connected(lstm_fc_id, input_concatID, WRconcatID, hasBias ? biasID : ""));
-    p.AddPrimitive(cldnn::reshape(gemmReshapeID, lstm_fc_id, gemmSz));
-    p.AddPrimitive(cldnn::reorder(gemmReorderID, gemmReshapeID, gemmLayout));
-    p.AddPrimitive(cldnn::lstm_elt(lstm_elt_id, gemmReorderID, cellInStr,
-                                   clip, 0, activations, activation_params, cldnn::lstm_weights_order::fizo));
+    p.AddPrimitive(cldnn::fully_connected(lstm_fc_id, input_concatID, WRconcatID, hasBias ? biasID : "", op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reshape(gemmReshapeID, lstm_fc_id, gemmSz, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reorder(gemmReorderID,
+                                  gemmReshapeID,
+                                  gemmLayout,
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
+    p.AddPrimitive(cldnn::lstm_elt(lstm_elt_id, gemmReorderID, cellInStr, clip, 0, activations,
+                                   activation_params, cldnn::lstm_weights_order::fizo, 0, op->get_friendly_name()));
 
     p.AddInnerPrimitiveToProfiler(lstm_fc_id, op->get_friendly_name(), op);
     p.AddInnerPrimitiveToProfiler(gemmReshapeID, op->get_friendly_name(), op);
@@ -156,16 +179,16 @@ void CreateLSTMCellOp(Program& p, const std::shared_ptr<ngraph::op::v4::LSTMCell>& op) {
-    p.AddPrimitive(cldnn::crop(outputHiddenCropID, lstm_elt_id, hiddenSz, cldnn::tensor{ 0, 0, 0, 0 }));
+    p.AddPrimitive(cldnn::crop(outputHiddenCropID, lstm_elt_id, hiddenSz, cldnn::tensor{ 0, 0, 0, 0 }, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(outputHiddenCropID, op->get_friendly_name(), op);
-    p.AddPrimitive(cldnn::reshape(outputHiddenID, outputHiddenCropID, outSz));
+    p.AddPrimitive(cldnn::reshape(outputHiddenID, outputHiddenCropID, outSz, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(outputHiddenID, op->get_friendly_name(), op);
 
     cldnn::primitive_id outputCellCropID = layerName + "_cc";
     cldnn::primitive_id outputCellID = layerName + ".1";
-    p.AddPrimitive(cldnn::crop(outputCellCropID, lstm_elt_id, hiddenSz, cellCropSz));
+    p.AddPrimitive(cldnn::crop(outputCellCropID, lstm_elt_id, hiddenSz, cellCropSz, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(outputCellCropID, op->get_friendly_name(), op);
-    p.AddPrimitive(cldnn::reshape(outputCellID, outputCellCropID, outSz));
+    p.AddPrimitive(cldnn::reshape(outputCellID, outputCellCropID, outSz, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(outputCellID, op->get_friendly_name(), op);
 
     // output primitive IDs
@@ -223,11 +246,16 @@ void CreateLSTMSequenceOp(Program& p, const std::shared_ptr<ngraph::op::v5::LSTMSequence>& op) {
-    p.AddPrimitive(cldnn::reshape(inReshapeID, inputPrimitives[0], inputShape));
-    p.AddPrimitive(cldnn::reorder(permuteID, inReshapeID, inputLayout));
+    p.AddPrimitive(cldnn::reshape(inReshapeID, inputPrimitives[0], inputShape, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reorder(permuteID,
+                                  inReshapeID,
+                                  inputLayout,
+                                  std::vector<float>(),
+                                  cldnn::reorder_mean_mode::subtract,
+                                  op->get_friendly_name()));
 
-    p.AddPrimitive(cldnn::reshape(inHiddenStateID, inputPrimitives[1], inStateShape));
-    p.AddPrimitive(cldnn::reshape(inCellStateID, inputPrimitives[2], inStateShape));
+    p.AddPrimitive(cldnn::reshape(inHiddenStateID, inputPrimitives[1], inStateShape, op->get_friendly_name()));
+    p.AddPrimitive(cldnn::reshape(inCellStateID, inputPrimitives[2], inStateShape, op->get_friendly_name()));
 
     p.AddInnerPrimitiveToProfiler(inReshapeID, op->get_friendly_name(), op);
     p.AddInnerPrimitiveToProfiler(permuteID, op->get_friendly_name(), op);
@@ -243,12 +271,12 @@ void CreateLSTMSequenceOp(Program& p, const std::shared_ptr<ngraph::op::v5::LSTMSequence>& op) {
-    p.AddPrimitive(cldnn::concatenation(WRconcatID, { weightID, recurrentID }, cldnn::concatenation::concatenation_axis::along_y));
+    p.AddPrimitive(cldnn::concatenation(WRconcatID, { weightID, recurrentID }, cldnn::concatenation::concatenation_axis::along_y, op->get_friendly_name()));
     p.AddInnerPrimitiveToProfiler(WRconcatID, op->get_friendly_name(), op);
 
     std::vector<size_t> WRreshapeSize = { 4 * size_t(lstm_hidden_size), size_t(lstm_input_size + lstm_hidden_size) };
 
     cldnn::primitive_id WRreshapeID = WRconcatID + "_reshape";
-    auto reshapeInPrim = cldnn::reshape(WRreshapeID, WRconcatID, CldnnTensorFromIEDims(WRreshapeSize));
+    auto reshapeInPrim = cldnn::reshape(WRreshapeID, WRconcatID, CldnnTensorFromIEDims(WRreshapeSize), op->get_friendly_name());
     p.AddPrimitive(reshapeInPrim);
     p.AddInnerPrimitiveToProfiler(WRreshapeID, op->get_friendly_name(), op);
@@ -267,30 +295,35 @@ void CreateLSTMSequenceOp(Program& p, const std::shared_ptr<ngraph::op::v5::LSTMSequence>& op) {
         cldnn::tensor offset_tensor{ 0, static_cast<int32_t>(seqIdx), 0, 0 };
         cldnn::primitive_id inputCrop_id = inputCropID + ":" + seqIdx_str;
-        p.AddPrimitive(cldnn::crop(inputCrop_id, permuteID, crop_tensor, offset_tensor));
+        p.AddPrimitive(cldnn::crop(inputCrop_id, permuteID, crop_tensor, offset_tensor, op->get_friendly_name()));
         p.AddInnerPrimitiveToProfiler(inputCrop_id, op->get_friendly_name(), op);
 
-        p.AddPrimitive(cldnn::concatenation(concatID, { inputCrop_id, hiddenStr }, cldnn::concatenation::concatenation_axis::along_x));
+        p.AddPrimitive(cldnn::concatenation(concatID, { inputCrop_id, hiddenStr }, cldnn::concatenation::concatenation_axis::along_x, op->get_friendly_name()));
         p.AddInnerPrimitiveToProfiler(concatID, op->get_friendly_name(), op);
 
-        p.AddPrimitive(cldnn::fully_connected(lstm_fc_id, concatID, WRreshapeID, biasID));
+        p.AddPrimitive(cldnn::fully_connected(lstm_fc_id, concatID, WRreshapeID, biasID, op->get_friendly_name()));
         p.AddInnerPrimitiveToProfiler(lstm_fc_id, op->get_friendly_name(), op);
 
-        p.AddPrimitive(cldnn::reshape(lstm_fc_resh_id, lstm_fc_id, gemmSz));
-        p.AddPrimitive(cldnn::reorder(lstm_fc_reor_id, lstm_fc_resh_id, gemmLayout));
-        p.AddPrimitive(cldnn::lstm_elt(lstm_elt_id, lstm_fc_reor_id, cellStr,
-                                       clip, 0, activations, activation_params, cldnn::lstm_weights_order::fizo));
+        p.AddPrimitive(cldnn::reshape(lstm_fc_resh_id, lstm_fc_id, gemmSz, op->get_friendly_name()));
+        p.AddPrimitive(cldnn::reorder(lstm_fc_reor_id,
+                                      lstm_fc_resh_id,
+                                      gemmLayout,
+                                      std::vector<float>(),
+                                      cldnn::reorder_mean_mode::subtract,
+                                      op->get_friendly_name()));
+        p.AddPrimitive(cldnn::lstm_elt(lstm_elt_id, lstm_fc_reor_id, cellStr, clip, 0, activations,
+                                       activation_params, cldnn::lstm_weights_order::fizo, 0, op->get_friendly_name()));
         p.AddInnerPrimitiveToProfiler(lstm_fc_resh_id, op->get_friendly_name(), op);
         p.AddInnerPrimitiveToProfiler(lstm_fc_reor_id, op->get_friendly_name(), op);
         p.AddInnerPrimitiveToProfiler(lstm_elt_id, op->get_friendly_name(), op);
 
         hiddenStr = crop_id + ":hidden";
         cellStr = crop_id + ":cell";
-        p.AddPrimitive(cldnn::crop(hiddenStr, lstm_elt_id, hiddenSz, cldnn::tensor{ 0, 0, 0, 0 }));
+        p.AddPrimitive(cldnn::crop(hiddenStr, lstm_elt_id, hiddenSz, cldnn::tensor{ 0, 0, 0, 0 }, op->get_friendly_name()));
         p.AddInnerPrimitiveToProfiler(hiddenStr, op->get_friendly_name(), op);
         output_ids_offsets.push_back(hiddenStr);
 
         if (i < lstm_sequence_len - 1) {
-            p.AddPrimitive(cldnn::crop(cellStr, lstm_elt_id, hiddenSz, cellCropSz));
+            p.AddPrimitive(cldnn::crop(cellStr, lstm_elt_id, hiddenSz, cellCropSz, op->get_friendly_name()));
             p.AddInnerPrimitiveToProfiler(cellStr, op->get_friendly_name(), op);
         } else {
             // last hidden state crop (output 2)
@@ -299,7 +332,7 @@ void CreateLSTMSequenceOp(Program& p, const std::shared_ptr<ngraph::op::v5::LSTMSequence>& op) {
-            p.AddPrimitive(cldnn::crop(cellStr, lstm_elt_id, hiddenSz, cellCropSz));
+            p.AddPrimitive(cldnn::crop(cellStr, lstm_elt_id, hiddenSz, cellCropSz, op->get_friendly_name()));
             cldnn::primitive_id outputCellID = layerName + ".2";
             p.AddInnerPrimitiveToProfiler(cellStr, op->get_friendly_name(), op);
             p.primitiveIDs[outputCellID] = cellStr;
@@ -310,7 +343,7 @@ void CreateLSTMSequenceOp(Program& p, const std::shared_ptr